framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,balanced,0.254805326461792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,balanced,0.1629706621170044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,balanced,0.2605280081431071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,balanced,0.4805599848429362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.14981119632720946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.14925440549850463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.2553215980529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,balanced,0.483791987101237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.25375359058380126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,balanced,0.9180533091227213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,balanced,0.4907733201980591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.19792640209197998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.1966528058052063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.46239361763000486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.39548799991607664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,balanced,0.49114668369293213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,balanced,0.9220266342163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.2,0.2847359895706177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,1,power_law_1.01,0.2738687992095947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,balanced,0.49667731920878094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.48200321197509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.438431978225708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,balanced,0.5010079940160116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.2,0.4795328140258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,1,power_law_1.01,0.4765376091003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,balanced,0.9253599643707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.8759807586669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,balanced,0.504858652750651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.8355199813842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.2,0.49205760955810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,1,power_law_1.01,0.479750394821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.9018560409545898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,balanced,0.5089173316955566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,balanced,0.9269493420918783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.878758430480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.2,0.49039998054504397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,balanced,0.512175997098287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.9299136161804199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,1,power_law_1.01,0.4985983848571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,balanced,0.14446933070818582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,balanced,0.5193386475245158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.9326399803161621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,power_law_1.01,0.1434175968170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.2,0.5253568172454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.9397952079772949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,1,power_law_1.01,0.5242815971374511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,balanced,0.5277386506398519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,balanced,0.9325493176778158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,balanced,0.2587466637293498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.9218815803527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,power_law_1.01,0.1912384033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.2,0.5202688217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.9518591880798339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,1,power_law_1.01,0.5250495910644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,balanced,0.5321173270543417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,balanced,0.4864159822463989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,power_law_1.01,0.256115198135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.9606143951416015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.2,0.5331136226654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.9723903656005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,balanced,0.5555946826934814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,1,balanced,0.9381386439005533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,1,power_law_1.01,0.5158016204833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,balanced,0.491706649462382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,power_law_1.01,0.457260799407959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,balanced,0.5680906772613525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.9789695739746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.2,0.5472447872161865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.984006404876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,1,balanced,0.9563893477121989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,1,power_law_1.01,0.5357312202453614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,balanced,0.49379201730092365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,balanced,0.5721333424250284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.2,0.5410048007965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,power_law_1.01,0.46078081130981446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.2,1.0364352226257325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.991487979888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,1,power_law_1.01,0.5412735939025879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,1,balanced,0.9614400068918864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,balanced,0.5015519857406616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,balanced,0.6059573491414388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.2,0.5699711799621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.2,1.1371007919311524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,power_law_1.01,0.5055615901947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,power_law_1.01,1.0707712173461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,1,power_law_1.01,0.5652160167694091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,balanced,0.6809439659118652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,balanced,0.5094399849573771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,1,balanced,0.9830239613850912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.2,1.1285056114196776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.2,0.5883647918701171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,power_law_1.01,0.5619840145111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,power_law_1.01,1.1369088172912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,balanced,0.727674643198649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,1,power_law_1.01,0.5929984092712403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,balanced,0.5142079989115397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,1,balanced,0.9839733441670736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.2,1.1553919792175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,power_law_1.01,0.6028351783752441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.2,0.60763521194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,balanced,0.9428373177846273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,1,power_law_1.01,0.6024127960205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,power_law_1.01,1.2030783653259278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,1,balanced,0.98963729540507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.2,1.2077119827270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.2,0.6302591800689697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,balanced,1.1163466771443684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,1,power_law_1.01,0.6310783863067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,power_law_1.01,1.1883008003234863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.2,1.216038417816162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,1,balanced,1.0451733271280925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.2,0.6263552188873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,1,power_law_1.01,0.6348415851593018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,power_law_1.01,1.224563217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,balanced,1.5734826723734539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,1,balanced,1.051024039586385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.2,1.297049617767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.2,0.7099647998809815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,balanced,0.5207146803538004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,balanced,1.0486133098602295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,1,power_law_1.01,0.7158656120300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.2,1.434879970550537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,1,power_law_1.01,1.2286080360412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,power_law_1.01,0.5766911983489991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.2,0.7929791927337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,balanced,2.0638720194498696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,balanced,1.0851466655731201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.2,1.6817344665527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,1,power_law_1.01,0.800716781616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,balanced,0.5266933441162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,0.9128128051757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,1,power_law_1.01,1.3053248405456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,power_law_1.01,0.5943808078765869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,balanced,1.1735520362854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,balanced,3.08568541208903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.2,2.0277952194213866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,0.8969087600708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,1.183347225189209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,1,power_law_1.01,1.3948863983154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,balanced,1.2200480302174885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.2,2.570822334289551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,1.171116828918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,1.3855039596557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,1,power_law_1.01,1.5733440399169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,balanced,1.5529173215230305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,balanced,4.372399965922038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.2,3.4533119201660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,1.4255616188049316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,1.9321855545043944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,1,power_law_1.01,2.0427711486816404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,balanced,1.8968799908955891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.2,4.426943969726563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,1.92806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,2.4285503387451173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,1,power_law_1.01,2.5355712890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,balanced,2.689253489176432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,balanced,6.583391825358073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.2,6.5268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,2.4764991760253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,3.5930240631103514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,balanced,0.5416053136189779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,1,power_law_1.01,3.5202686309814455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,power_law_1.01,0.575596809387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,balanced,3.536543846130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,3.619033432006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.2,8.870841979980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,balanced,0.5506666501363119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,4.523641586303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,power_law_1.01,0.5969408035278321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,1,power_law_1.01,4.458528137207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,balanced,8.881429036458334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,balanced,0.5627573331197103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,4.567359924316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,balanced,5.38481076558431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,power_law_1.01,0.6202047824859619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,6.632441711425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,balanced,0.580298662185669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.2,13.955859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,1,power_law_1.01,6.695116424560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,power_law_1.01,0.7143487930297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,balanced,0.6107946634292603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,6.688409423828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,power_law_1.01,0.6656000137329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,9.488089752197265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,balanced,7.841077168782552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,1,power_law_1.01,9.055347442626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,balanced,0.6339093446731567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,power_law_1.01,0.7139647960662842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.2,17.48621368408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,balanced,11.42642084757487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,9.425638580322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,power_law_1.01,0.8316479682922363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,balanced,0.6743573347727457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.2,11.885619354248046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,power_law_1.01,1.0728768348693847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,power_law_1.01,13.932127380371094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,balanced,0.9818346500396729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.2,21.722093200683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,1,power_law_1.01,11.831993865966798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.01,1.3074111938476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,1,balanced,11.672325134277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,balanced,1.0439039866129558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.01,1.791801643371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.2,18.917958068847657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,power_law_1.01,17.43306884765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,balanced,1.5506666501363118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.01,2.3251583099365236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,power_law_1.01,18.688595581054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.01,3.2826816558837892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.2,33.53810424804688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,balanced,2.0832266807556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,1,balanced,18.69802729288737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,1,balanced,17.0405756632487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.01,4.297580718994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,power_law_1.01,21.88577880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.2,36.50271301269531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,balanced,3.1290772755940757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.01,6.2804607391357425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,power_law_1.01,36.4890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,balanced,4.1713441212972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.01,8.426060485839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,power_law_1.01,33.68299560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.2,61.511566162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,1,balanced,21.49219258626302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,balanced,6.233205159505208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.01,12.826495361328124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.01,18.15680694580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,balanced,8.32862917582194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,power_law_1.01,62.06852416992187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,1,balanced,36.690452575683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.01,23.38561248779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,balanced,12.52566401163737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,1,balanced,33.065643310546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,power_law_1.01,39.709677124023436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,balanced,17.077723185221355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,balanced,21.850357055664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,power_law_1.01,87.54498291015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,1,balanced,60.423909505208336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,balanced,38.74267323811849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,balanced,92.3102518717448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,balanced,0.2683839996655782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,balanced,0.46080533663431805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,balanced,0.4262506564458211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,balanced,0.8012959957122803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,1,power_law_1.2,0.14323840141296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,balanced,0.8109599749247233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,balanced,1.5575092633565266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,balanced,0.8129386901855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,1,power_law_1.2,0.17950719594955444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,balanced,1.5627999305725098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,1,power_law_1.2,0.2451200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,balanced,0.8134346803029379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,1,power_law_1.2,0.47811198234558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,balanced,1.560933272043864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,balanced,0.822645346323649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.4273087978363037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,1,power_law_1.2,0.4713791847229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,balanced,1.5663092931111653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,balanced,0.8277866840362549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,1,power_law_1.2,0.5018496036529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.6262207984924316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,balanced,0.8365440368652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,balanced,1.569973309834798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,1,power_law_1.2,0.5464704036712646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,balanced,0.8384319941202799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.8750144004821777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,balanced,1.579418659210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,1,power_law_1.2,0.5934207916259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,balanced,0.8421973387400309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,balanced,1.6156959533691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.01,1.5633279800415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,balanced,0.2571360071500142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,balanced,0.8552800019582113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.01,0.24524800777435302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,balanced,1.6232800483703613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.01,1.5602496147155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,balanced,0.41522665818532306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,balanced,0.8659359614054362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,1,power_law_1.2,0.5686207771301269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.01,0.3134912014007568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.01,1.523583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,balanced,1.637349287668864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,balanced,0.7933493455251058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,balanced,0.876319964726766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.01,0.41409921646118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,1,power_law_1.2,0.597324800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.01,1.6608192443847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,balanced,1.656933307647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,balanced,0.7993280092875162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,balanced,0.9046186606089274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.01,0.736729621887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.01,1.645587158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,balanced,1.654863993326823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,balanced,0.8035626411437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,balanced,0.9245226383209229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.01,0.793068790435791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,1,power_law_1.2,0.5768320083618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,balanced,1.7465920448303223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.01,1.6764863967895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,balanced,0.812608003616333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,balanced,0.9227360089619955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.01,0.802182388305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,1,power_law_1.2,0.5962048053741456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,balanced,0.8214666843414307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.01,1.8257152557373046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,balanced,1.760192076365153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.01,0.8798144340515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,balanced,0.9732426802317301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,1,power_law_1.2,0.6422656059265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,balanced,0.8282559712727865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,balanced,1.7642505963643391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.01,1.7637952804565429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.01,0.8828672409057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,balanced,1.0617067019144695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,1,power_law_1.2,0.7007999897003174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.01,1.8783487319946288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.01,0.9130111694335937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,balanced,1.781882603963216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,power_law_1.01,0.22572801113128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,balanced,1.1060160001118977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,1,power_law_1.2,0.6574783802032471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.01,0.9216383934020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.01,1.9572416305541993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,power_law_1.01,0.33061120510101316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,balanced,1.927578608194987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,balanced,1.444719950358073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,1,power_law_1.2,0.715558385848999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,power_law_1.01,0.32718720436096194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.01,0.9066431999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.01,1.8664896011352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,1,power_law_1.2,0.7998464107513428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,balanced,1.7552587191263835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,balanced,0.8378720283508301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,balanced,1.9689812660217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,power_law_1.01,0.7783167839050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.01,0.9198911666870118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.01,1.9159616470336913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,power_law_1.01,0.7829823970794678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,1,power_law_1.2,1.088710403442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,balanced,2.463040033976237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,balanced,2.529690742492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,balanced,0.8464852968851725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.01,0.9758144378662109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,power_law_1.01,0.8304448127746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.01,2.084115219116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.2,1.289510440826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,power_law_1.01,0.9507648468017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.01,0.9574463844299317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,balanced,3.623957316080729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,balanced,3.0996907552083335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.2,1.7968576431274415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.01,2.1100736618041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,power_law_1.01,1.0089280128479003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.01,1.0116479873657227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.2,2.3100799560546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.01,2.346918487548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,balanced,4.522634824117024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,balanced,5.532847722371419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.01,1.0402303695678712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.2,3.2641342163085936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.01,2.7346879959106447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,power_law_1.01,0.9718784332275391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.01,1.066368007659912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,balanced,6.254949569702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.01,3.425120162963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,power_law_1.01,1.0433600425720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,balanced,6.880032221476237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.2,4.2778881072998045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.01,1.2925439834594727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.01,1.4908096313476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.01,4.320051193237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.2,6.307257461547851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,balanced,9.450949350992838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,balanced,0.864192008972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.01,1.9084480285644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,power_law_1.01,0.9313023567199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,balanced,10.852160135904947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.01,5.856198501586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.2,8.388172912597657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,balanced,0.878602663675944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.01,2.3572288513183595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,power_law_1.01,0.969273567199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,balanced,13.405007680257162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.4414527893066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.01,7.502444458007813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,power_law_1.01,1.0400383949279786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.01,3.103993606567383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,balanced,0.893280029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.2,13.05704345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,power_law_1.01,1.1761024475097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.6376192092895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.01,4.397216033935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,balanced,0.917359987894694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,balanced,14.866101582845053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.01,11.805280303955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,power_law_1.01,1.0718208312988282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.7063680171966553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.2,18.023321533203124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.01,6.234355163574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,power_law_1.01,1.1409919738769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,balanced,22.522745768229168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,balanced,0.9603573481241862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,1,power_law_1.2,1.5985024452209473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,power_law_1.01,1.3579008102416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.01,18.115571594238283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.01,8.00811538696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,power_law_1.01,1.6739456176757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,1,power_law_1.2,1.5191360473632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,balanced,0.9864266713460287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.2,23.052537536621095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.01,2.008940887451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,balanced,19.003568013509113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,1,power_law_1.2,1.6499391555786134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.01,12.156998443603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,balanced,1.034511963526408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.01,2.8342655181884764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.01,27.3257080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,1,power_law_1.2,1.6913471221923828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,balanced,26.723673502604168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.01,3.6460800170898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.01,16.598591613769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,1,power_law_1.2,1.6630783081054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,balanced,1.508863925933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,1,power_law_1.2,39.964254760742186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.01,5.227033615112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,1,power_law_1.2,1.7421247482299804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,balanced,1.6141546567281086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,1,power_law_1.2,1.838707160949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.01,6.832998657226563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.01,21.30194549560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.01,37.8973876953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,1,power_law_1.2,1.8123903274536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,balanced,30.014564514160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.01,10.463423919677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,balanced,2.386261304219564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,balanced,39.237536112467446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,1,power_law_1.2,1.8483711242675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,1,power_law_1.2,1.9590719223022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.01,30.345196533203126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,balanced,3.1707894007364907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.01,14.44318084716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,1,power_law_1.2,1.8926591873168945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,1,power_law_1.2,87.69484252929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,1,power_law_1.2,2.0839359283447267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.01,42.351828002929686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,balanced,4.800677299499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,1,power_law_1.2,2.040153694152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.01,23.302444458007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,balanced,6.557088216145833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,1,power_law_1.2,2.182419204711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.01,59.195745849609374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,1,power_law_1.2,2.477734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,balanced,54.82417297363281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.01,32.648684692382815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,balanced,9.842682520548502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,1,power_law_1.2,2.828486442565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.01,56.72684326171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,1,power_law_1.2,3.6379135131835936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,balanced,59.601521809895836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,balanced,13.841850280761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.01,42.36593322753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,1,power_law_1.2,4.565644836425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,1,power_law_1.2,6.259756851196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,balanced,22.6319580078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,1,power_law_1.2,8.234925079345704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,1,power_law_1.2,12.631116485595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.01,110.909130859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,power_law_1.01,72.26608276367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,balanced,32.936378479003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,1,power_law_1.2,16.972032165527345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,balanced,109.6582539876302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,1,power_law_1.2,25.87397155761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,balanced,43.09406026204427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,1,power_law_1.2,32.64720764160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,power_law_1.01,156.0410888671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,1,power_law_1.2,42.12862854003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,balanced,76.70729064941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,1,power_law_1.2,54.00269775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,1,power_law_1.2,103.3520263671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,balanced,168.8788859049479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.23262720108032225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,1,power_law_1.2,0.33817598819732664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,1,power_law_1.2,0.4307712078094482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,1,power_law_1.2,0.8124287605285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,1,power_law_1.2,0.8129152297973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,1,power_law_1.2,0.813811206817627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,1,power_law_1.2,0.8739456176757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,1,power_law_1.2,0.22588160037994384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,1,power_law_1.2,0.8634431838989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,1,power_law_1.2,0.9134271621704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,1,power_law_1.2,0.34701440334320066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,1,power_law_1.2,0.9300928115844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,1,power_law_1.2,0.45211520195007326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,1,power_law_1.2,0.8980863571166993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,1,power_law_1.2,0.7413119792938232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,1,power_law_1.2,0.9309503555297851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,1,power_law_1.2,0.9992064476013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,1,power_law_1.2,0.7826303958892822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,1,power_law_1.2,0.9569536209106445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,1,power_law_1.2,0.8645952224731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,1,power_law_1.2,1.0248191833496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,1,power_law_1.2,1.0510656356811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,1,power_law_1.2,0.9452223777770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,1,power_law_1.2,1.0938624382019042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,1,power_law_1.2,1.0149567604064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,1,power_law_1.2,1.3073280334472657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,1.4280447959899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,1,power_law_1.2,0.9693759918212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,1.8889663696289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,2.2701120376586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,1,power_law_1.2,1.0336640357971192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,3.1653440475463865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,4.397209548950196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,1,power_law_1.2,0.9262335777282715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,balanced,0.3065386613210042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,6.283366394042969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,balanced,0.48719465732574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,1,power_law_1.2,0.9668864250183106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,8.051641845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,balanced,0.9325493176778158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,1,power_law_1.2,1.0316736221313476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,balanced,1.8460267384847004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,1,power_law_1.2,1.1742400169372558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,12.114393615722657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,balanced,3.637989362080892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,1,power_law_1.2,1.075436782836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,1,power_law_1.2,1.1453120231628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,balanced,7.240933100382487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,16.546060180664064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,1,power_law_1.2,1.3080191612243652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,balanced,7.267855962117513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,1,power_law_1.2,1.6681983947753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.2,2.1095039367675783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,1,power_law_1.2,20.722828674316407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,balanced,7.3077437082926435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.2,2.809209632873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,balanced,7.325429280598958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,balanced,0.15845333536465964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.2,3.5578174591064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,balanced,7.34548823038737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,1,power_law_1.2,30.2947509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.2,5.173388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,balanced,0.2706186572710673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,balanced,7.375247955322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.2,6.846367645263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,balanced,0.4965759913126628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,balanced,7.3758290608723955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,balanced,0.9550933043162028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.2,10.346425628662109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,balanced,1.8619893391927083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,balanced,7.421648025512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,balanced,0.2189120054244995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.2629760026931763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.2,14.263130187988281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,balanced,3.7016000747680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,1,power_law_1.2,59.3109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,balanced,0.3041653235753377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,balanced,7.357898712158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,balanced,3.7153600056966147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.4909696102142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,balanced,0.5339893500010172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.5705471992492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.2,23.09040069580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,balanced,7.375408172607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,balanced,3.7175305684407554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,balanced,0.9679413636525472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.01,1.3761216163635255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,balanced,1.8559786478678386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,balanced,3.7340428034464517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,balanced,7.452085494995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.01,2.2661951065063475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,balanced,3.618879954020182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,balanced,3.7357441584269204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.2,31.963687133789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.01,3.268787384033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,balanced,7.4818878173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,balanced,3.6383946736653647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,balanced,3.7552159627278647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.01,4.785958480834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,balanced,3.655461311340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,balanced,7.803418477376302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,balanced,3.767173449198405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,balanced,3.670442581176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.01,5.167052841186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.2,42.25087280273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,balanced,3.6846399307250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.01,5.441715240478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,balanced,3.8009332021077475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,balanced,8.079455693562826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,balanced,3.71285343170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.01,5.687660980224609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,balanced,3.8400001525878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,balanced,3.7403732935587564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.01,5.862464141845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,balanced,8.361370722452799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,balanced,3.873045285542806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,balanced,3.7707414627075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.1779904007911682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.01,6.02782096862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,balanced,3.830512046813965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,1,power_law_1.2,72.13426513671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,balanced,3.911856015523275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.01,0.2774784088134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,balanced,8.5273068745931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.01,6.0497089385986325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,balanced,3.8962720235188804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.01,0.33586559295654295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,balanced,3.9747467041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,balanced,3.9443626403808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.01,6.401542663574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.01,0.737497615814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,balanced,8.887653350830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,balanced,4.050517400105794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.01,6.557894134521485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.01,1.2083071708679198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,balanced,4.052133242289226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.01,1.7716608047485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.01,6.877855682373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,balanced,4.197098731994629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,balanced,9.388437271118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.01,2.5198976516723635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.01,6.993376159667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,power_law_1.01,0.22901759147644044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.01,2.70248966217041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,balanced,4.273674647013347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,balanced,4.278191884358724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.01,7.862175750732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,power_law_1.01,0.3286463975906372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.01,2.8302591323852537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,power_law_1.01,0.3316096067428589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,balanced,9.992666880289713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,1,power_law_1.2,153.5477294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.01,8.246265411376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,balanced,4.536752065022786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.01,2.8459135055541993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,power_law_1.01,0.7423935890197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.01,3.0178176879882814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.01,9.810918426513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,power_law_1.01,1.1764032363891601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,balanced,4.792106628417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.01,3.168659210205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,power_law_1.01,1.744825553894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.01,8.970873260498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.01,3.2328128814697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,balanced,10.7806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,power_law_1.01,2.491072082519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,balanced,4.4975840250651045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.01,10.224134063720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.01,3.3013118743896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,balanced,5.095775922139485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,power_law_1.01,2.6451391220092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.01,3.4436737060546876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.01,10.786361694335938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,balanced,4.887882550557454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,power_law_1.01,2.734003257751465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.01,3.5991424560546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,power_law_1.01,2.802911949157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.01,13.087557983398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,balanced,5.2403519948323565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.01,4.201561737060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,balanced,6.216053644816081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,power_law_1.01,3.0108543395996095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,balanced,13.888720194498697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.01,4.617971038818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,power_law_1.01,3.201772689819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.01,16.03992919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,balanced,6.016826629638672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,4.413363265991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,power_law_1.01,3.398828887939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.01,22.220428466796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,power_law_1.01,3.653401565551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,5.218982315063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,balanced,6.719055811564128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,balanced,6.367200215657552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,power_law_1.01,3.9179454803466798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,4.550495910644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.01,34.075442504882815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,power_law_1.01,4.207136154174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,5.1739967346191404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,balanced,11.042746225992838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,power_law_1.01,4.840729522705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,balanced,29.35473124186198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,5.683456039428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.01,40.46815490722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,7.0428413391113285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,balanced,8.393237431844076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,power_law_1.01,4.885580825805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,8.229299163818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,balanced,12.960309346516928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.01,4.6376384735107425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,11.153510284423827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.01,60.25297241210937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.01,5.62158088684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,14.7046142578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.01,6.528934478759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.01,18.13673553466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,balanced,31.55719502766927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,balanced,10.902581532796225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.01,6.870745849609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,balanced,18.884437561035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.01,8.534809875488282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.01,89.59063110351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.01,23.5936767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.01,11.572978973388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.01,14.998162841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.01,43.82960510253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.01,21.40985565185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,balanced,27.88702392578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,balanced,13.257525126139322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.01,29.33743896484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.01,35.878790283203124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,balanced,55.735636393229164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,balanced,34.78416442871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,power_law_1.01,59.45353393554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,balanced,21.69641621907552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.2639807939529419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.4751488208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,power_law_1.01,123.8720947265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.5616576194763183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,1,power_law_1.2,1.1790271759033204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,1,power_law_1.2,1.988595199584961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,1,power_law_1.2,2.7893632888793944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,1,power_law_1.2,4.684211349487304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,balanced,59.62555440266927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,1,power_law_1.2,4.942617416381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,1,power_law_1.2,5.197081756591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,1,power_law_1.2,5.564038467407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,1,power_law_1.2,5.8836414337158205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,1,power_law_1.2,6.103475189208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,1,power_law_1.2,6.356211090087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,1,power_law_1.2,6.615321350097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,balanced,74.45521545410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,1,power_law_1.2,6.9723968505859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.17761919498443604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,1,power_law_1.2,7.084352111816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,1,power_law_1.2,0.26813440322875975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,1,power_law_1.2,0.31738879680633547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,1,power_law_1.2,7.380563354492187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,1,power_law_1.2,0.6235328197479248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,1,power_law_1.2,1.0220095634460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,1,power_law_1.2,8.083769226074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,1,power_law_1.2,1.4953408241271973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,1,power_law_1.2,2.393363189697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,1,power_law_1.2,9.076652526855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,1,power_law_1.2,2.6336896896362303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,balanced,44.99185689290365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,1,power_law_1.2,2.694272041320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,1,power_law_1.2,10.321158599853515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,1,power_law_1.2,2.841036796569824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,1,power_law_1.2,9.561644744873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,1,power_law_1.2,2.947091293334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,1,power_law_1.2,3.0597888946533205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,1,power_law_1.2,10.606028747558593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,1,power_law_1.2,3.202649688720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,1,power_law_1.2,11.581804656982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,1,power_law_1.2,3.2661182403564455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,1,power_law_1.2,3.500691223144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,1,power_law_1.2,14.502578735351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,1,power_law_1.2,3.5531326293945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,1,power_law_1.2,17.90192565917969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,1,power_law_1.2,4.282643127441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,1,power_law_1.2,4.833049774169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,balanced,121.5578104654948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,1,power_law_1.2,24.66026916503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,4.768652725219726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,5.434246444702149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,4.800076675415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,1,power_law_1.2,31.633145141601563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,5.391059112548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,5.933427047729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,7.445401763916015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,1,power_law_1.2,38.03800964355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,8.590796661376952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,11.654752349853515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,1,power_law_1.2,53.425115966796874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,15.345164489746093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,1,power_law_1.2,18.723033142089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,1,power_law_1.2,0.21823360919952392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,1,power_law_1.2,0.32933759689331055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,balanced,0.05306133131186167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,1,power_law_1.2,22.67888641357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,balanced,0.07365333537260692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,1,power_law_1.2,0.3441472053527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,balanced,0.12452800075213115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,1,power_law_1.2,85.31187133789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,1,power_law_1.2,0.6418560028076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,balanced,0.2262453238169352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,balanced,0.4217919905980428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,1,power_law_1.2,1.0222208023071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,balanced,0.4306666851043701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,balanced,0.4333173433939616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,1,power_law_1.2,1.4186240196228028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,1,power_law_1.2,44.41299743652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,balanced,0.4341653188069661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,balanced,0.4352320035298665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,1,power_law_1.2,2.3427839279174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,balanced,0.4362773497899373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,1,power_law_1.2,2.5150592803955076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,balanced,0.43670399983723956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,balanced,0.4413546721140544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,1,power_law_1.2,2.5885440826416017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,balanced,0.44500799973805744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,1,power_law_1.2,2.8610815048217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,balanced,0.44887999693552655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,1,power_law_1.2,3.0639551162719725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,balanced,0.47068798542022705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,balanced,0.4716586669286092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,1,power_law_1.2,3.330316925048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,balanced,0.49067731698354083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,1,power_law_1.2,3.455769729614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,1,power_law_1.2,3.6805248260498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,balanced,0.517743984858195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,balanced,0.5559999942779541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,1,power_law_1.2,4.049216079711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,balanced,0.600106676419576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,1,power_law_1.2,4.3817790985107425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,balanced,0.6414613326390585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,1,power_law_1.2,4.93804817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,balanced,0.7865386803944906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,1,power_law_1.2,5.114815902709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,balanced,0.040192000567913055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,balanced,0.8836159706115723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,balanced,0.05594133337338766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,balanced,0.08113066852092743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.2,4.9245952606201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,balanced,0.1341333289941152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,balanced,1.1815520127614338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,balanced,0.23266132672627768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,balanced,0.23678932587305704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.2,5.77088623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.2,6.747577667236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,balanced,0.2413653333981832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,balanced,0.2402720053990682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,balanced,1.5026346842447917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.2,7.299180603027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,balanced,0.24127467473347983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,balanced,0.24379199743270874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.2,8.693875122070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,balanced,0.2497653365135193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,balanced,0.25225067138671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.2,11.579942321777343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,balanced,0.25562665859858197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,balanced,2.1404107411702475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,balanced,0.2653706669807434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.2,14.921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,balanced,0.27292799949645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,balanced,0.27613866329193115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.2,21.675704956054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,balanced,0.29545066754023236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,balanced,0.32505067189534503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.2,28.189453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,balanced,0.35013333956400555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,balanced,2.8807252248128257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,balanced,0.4031840165456136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,balanced,0.06515733400980632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.2,34.742593383789064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,balanced,0.4540319840113322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,balanced,0.0717439999183019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,power_law_1.01,0.04811519980430603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,balanced,0.08935466408729553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,power_law_1.01,0.055667197704315184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,balanced,0.1430186629295349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,balanced,0.6074293454488119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,power_law_1.01,0.10280959606170655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,balanced,0.23692800601323447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,balanced,0.24288533131281534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,power_law_1.01,0.14810240268707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,1,power_law_1.2,56.455108642578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,balanced,0.2476373314857483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,power_law_1.01,0.2109760046005249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,balanced,0.7210133075714111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,balanced,0.24945600827534994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,power_law_1.01,0.33960959911346433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,balanced,3.6194559733072915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,balanced,0.2550133268038432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,power_law_1.01,0.35966079235076903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,balanced,0.25837866465250653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,power_law_1.01,0.37740159034729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,balanced,0.2660906712214152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,balanced,1.0166666507720947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,balanced,0.2733386754989624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,power_law_1.01,0.397760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,balanced,0.2797813415527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,power_law_1.01,0.4066751956939697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,power_law_1.01,0.40375680923461915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,balanced,0.2911626696586609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,power_law_1.01,0.40886402130126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,1,power_law_1.2,115.2469482421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,balanced,1.327946662902832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,power_law_1.01,0.42520961761474607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,power_law_1.01,0.4396992206573486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,power_law_1.01,0.03916800022125244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,power_law_1.01,0.4536640167236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,power_law_1.01,0.043699198961257936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,balanced,0.3041440049807231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,power_law_1.01,0.4606143951416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,power_law_1.01,0.06657919883728028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,balanced,0.3158186674118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,power_law_1.01,0.5137152194976806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,power_law_1.01,0.0989247977733612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,balanced,1.9456960360209148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,power_law_1.01,0.569811201095581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,power_law_1.01,0.12300159931182861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,balanced,5.867290496826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,power_law_1.01,0.5635583877563477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,power_law_1.01,0.19505280256271362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,power_law_1.01,0.6279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,power_law_1.01,0.21400320529937744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,power_law_1.01,0.6582911968231201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,power_law_1.01,0.21946239471435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,balanced,0.3513760169347127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,power_law_1.01,0.8073151588439942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,power_law_1.01,0.22421760559082032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,balanced,0.4095413287480672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,power_law_1.01,0.2314687967300415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,power_law_1.01,0.9507455825805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,balanced,2.565605322519938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,balanced,0.4609866539637248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,power_law_1.01,0.23535358905792236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,power_law_1.01,1.2777791976928712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,power_law_1.01,0.24674561023712158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,balanced,0.5935946702957153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,power_law_1.01,1.611180877685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,power_law_1.01,0.2553855895996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,power_law_1.01,2.319718360900879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,balanced,0.6915626525878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,power_law_1.01,0.25992960929870607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,power_law_1.01,0.2735680103302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,power_law_1.01,3.002444839477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,power_law_1.01,0.2795007944107056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,balanced,1.008250633875529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,power_law_1.01,3.753081512451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,power_law_1.01,0.05596799850463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,power_law_1.01,0.2980096101760864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,power_law_1.01,0.06579840183258057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,power_law_1.01,0.33591039180755616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,power_law_1.01,5.592089462280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,power_law_1.01,0.07927039861679078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,balanced,1.2055573463439941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,power_law_1.01,0.36433279514312744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,power_law_1.01,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,balanced,3.1939147313435874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,power_law_1.01,0.43135361671447753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,power_law_1.01,0.13251839876174926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,power_law_1.01,11.706221008300782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,1,power_law_1.2,0.047712001204490664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,power_law_1.01,0.20478079319000245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,power_law_1.01,0.497760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,1,power_law_1.2,0.05783680081367493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,power_law_1.01,0.21512959003448487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,balanced,1.7796907424926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,power_law_1.01,0.6205503940582275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,power_law_1.01,0.22560639381408693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,1,power_law_1.2,0.09200000166893005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,power_law_1.01,0.7680511951446534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,power_law_1.01,0.23143041133880615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,1,power_law_1.2,0.12735999822616578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,power_law_1.01,1.0603648185729981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,power_law_1.01,0.24394240379333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,1,power_law_1.2,0.17161600589752196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,power_law_1.01,0.2606015920639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,power_law_1.01,1.348691177368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,1,power_law_1.2,0.33791360855102537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,balanced,2.3566293716430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,power_law_1.01,0.2637120008468628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,power_law_1.01,1.947078323364258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,1,power_law_1.2,0.3687295913696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,power_law_1.01,0.28063359260559084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,1,power_law_1.2,0.3966655969619751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,power_law_1.01,0.3000511884689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,power_law_1.01,2.5851072311401366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,balanced,11.459439595540365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,1,power_law_1.2,0.39927680492401124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,power_law_1.01,3.184147262573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,1,power_law_1.2,0.40757122039794924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,power_law_1.01,0.30979199409484864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,power_law_1.01,4.915564727783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,balanced,3.4676214853922525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,1,power_law_1.2,0.41407361030578616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,power_law_1.01,0.328108811378479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,balanced,5.083248138427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,1,power_law_1.2,0.4240384101867676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,power_law_1.01,10.176921844482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,1,power_law_1.2,0.4301439762115479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,power_law_1.01,0.3512831926345825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,1,power_law_1.2,0.4422463893890381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,power_law_1.01,0.41495041847229003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,1,power_law_1.2,0.4552639961242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,power_law_1.01,0.4879039764404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,1,power_law_1.2,0.4614272117614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,power_law_1.01,0.6294911861419678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,1,power_law_1.2,0.5194943904876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,balanced,4.602389335632324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,power_law_1.01,0.7635647773742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,1,power_law_1.2,0.5684927940368653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,1,power_law_1.2,0.5616447925567627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,power_law_1.01,1.0350591659545898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,1,power_law_1.2,0.6214655876159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,power_law_1.01,1.3093503952026366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,1,power_law_1.2,0.6850944042205811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,power_law_1.01,1.861337661743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,1,power_law_1.2,0.8292096138000489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,power_law_1.01,2.4277376174926757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,1,power_law_1.2,0.9865407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,power_law_1.01,3.5495487213134767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,1,power_law_1.2,1.3256447792053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,power_law_1.01,4.675872039794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,balanced,5.728421529134114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,1,power_law_1.2,1.6537343978881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,power_law_1.01,5.78455696105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,1,power_law_1.2,2.3485631942749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,1,power_law_1.2,3.114540863037109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,power_law_1.01,9.136128234863282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,1,power_law_1.2,3.8390464782714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,power_law_1.01,18.052928161621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,1,power_law_1.2,5.556172943115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,1,power_law_1.2,11.718291473388671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,balanced,9.842517217000326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,balanced,9.103631973266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,1,power_law_1.2,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,1,power_law_1.2,0.04635519981384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,1,power_law_1.2,0.06347519755363465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,1,power_law_1.2,0.08880640268325805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,1,power_law_1.2,0.11386239528656006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,1,power_law_1.2,0.19805439710617065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,1,power_law_1.2,0.21404800415039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,1,power_law_1.2,0.22028160095214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,1,power_law_1.2,0.2261631965637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,1,power_law_1.2,0.23168001174926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,1,power_law_1.2,0.2410559892654419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,1,power_law_1.2,0.24877440929412842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,1,power_law_1.2,0.2631295919418335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,1,power_law_1.2,0.26353280544281005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,1,power_law_1.2,0.27603199481964114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,balanced,18.104607899983723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,1,power_law_1.2,0.28869760036468506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,1,power_law_1.2,0.30176639556884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,1,power_law_1.2,0.3434112071990967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,1,power_law_1.2,0.37557120323181153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,1,power_law_1.2,0.4351679801940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,1,power_law_1.2,0.5059711933135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,1,power_law_1.2,0.6466368198394775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,1,power_law_1.2,0.7803199768066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,1,power_law_1.2,1.0759807586669923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,1,power_law_1.2,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,1,power_law_1.2,1.3668928146362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,1,power_law_1.2,1.967692756652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,1,power_law_1.2,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,1,power_law_1.2,2.588422393798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,1,power_law_1.2,0.07913600206375122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,1,power_law_1.2,0.09985920190811157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,1,power_law_1.2,3.1927871704101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,1,power_law_1.2,0.11960959434509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,balanced,0.13928533593813577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,1,power_law_1.2,4.955718231201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,1,power_law_1.2,0.2040191888809204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,balanced,0.22355733315149942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,1,power_law_1.2,0.2197567939758301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,balanced,0.42688000202178955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,1,power_law_1.2,10.263251495361327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,balanced,0.8252960046132406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,1,power_law_1.2,0.2310784101486206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,balanced,1.6082347234090169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,1,power_law_1.2,0.24111359119415282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,balanced,1.6109867095947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,1,power_law_1.2,0.2507904052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,1,power_law_1.2,0.25866239070892333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,balanced,1.6212746302286785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,1,power_law_1.2,0.27333118915557864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,balanced,1.6266239484151204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,1,power_law_1.2,0.2854655981063843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,balanced,0.08982933561007182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,balanced,1.6329065958658855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,1,power_law_1.2,0.3066431999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,balanced,1.637994607289632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,balanced,0.12936000029246011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,balanced,1.641690731048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,1,power_law_1.2,0.3145024061203003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,balanced,0.22673600912094116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,balanced,1.6550720532735188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,1,power_law_1.2,0.33496320247650146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,balanced,0.42390398184458417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,balanced,1.666975975036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,balanced,0.8179360230763754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,balanced,1.6786613464355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,1,power_law_1.2,0.3555392026901245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,balanced,0.8222400347391764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,balanced,1.7218613624572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,1,power_law_1.2,0.4198783874511719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,balanced,0.8289653460184733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,1,power_law_1.2,0.49658880233764646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,balanced,1.738591988881429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,balanced,0.8353226979573568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,1,power_law_1.2,0.6385536193847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,balanced,0.8433547019958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,1,power_law_1.2,0.7732672214508056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,balanced,1.796895980834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,balanced,0.8447733720143636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,1,power_law_1.2,1.047430419921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,balanced,1.8349439303080242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,1,power_law_1.2,1.3273280143737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,balanced,0.8525813420613607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,1,power_law_1.2,1.8880447387695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,balanced,1.9278292655944824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,balanced,0.860490640004476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,1,power_law_1.2,2.449087905883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,balanced,0.8754666646321615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,balanced,2.0220212936401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,1,power_law_1.2,3.5755390167236327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,balanced,0.8937333424886068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,1,power_law_1.2,4.673574447631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,balanced,0.9076053301493326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,balanced,2.098735968271891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,1,power_law_1.2,5.808575820922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,balanced,0.9145920276641846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,balanced,0.9359306494394938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,1,power_law_1.2,9.158905792236329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,balanced,2.386927922566732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,balanced,0.9848906993865967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,1,power_law_1.2,18.075596618652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.07930240035057068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,balanced,1.0436960061391194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,balanced,2.587477366129557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.08755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.12260479927062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,balanced,1.1291786829630535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.17834880352020263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.15372159481048583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,balanced,3.3069067001342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,balanced,1.2198293209075928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.01,0.28178560733795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.3165760040283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.472211217880249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.01,0.38243200778961184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,balanced,1.456282615661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.7357056140899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.01,0.6744192123413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.01,0.7068543910980225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.01,1.2842880249023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,balanced,0.0958720048268636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,balanced,5.664106369018555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.01,1.3385024070739746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.01,0.7430592060089112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,balanced,1.6404159863789876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,balanced,0.141157329082489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.01,1.4189824104309081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,balanced,0.23455466826756796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.01,0.7407487869262696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.01,1.445798397064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,balanced,0.42935999234517414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.01,1.4797632217407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.01,0.7855936050415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,balanced,0.8090133666992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,balanced,2.1987627347310386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.01,1.5431615829467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,balanced,0.8190186818440756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.01,0.7944960117340087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,balanced,0.8290879726409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.01,1.608006477355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.01,0.8413951873779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,balanced,0.8383413155873617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,balanced,7.658709208170573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.01,1.6350847244262696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,balanced,0.8476106325785319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.01,0.8444416046142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.01,1.637708854675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,balanced,0.8549280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,balanced,2.861333211263021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.01,1.689632034301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.01,0.9147775650024415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,balanced,0.8691146373748779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.01,1.7302080154418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,balanced,0.8850933710734049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.01,0.9492159843444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.01,1.778758430480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,balanced,0.8974346319834391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.01,0.9734848022460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.01,1.99102725982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,balanced,0.9232107003529867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.01,1.9923519134521483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.01,0.9324031829833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.01,2.085203170776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,balanced,8.28547732035319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.01,1.021951961517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,balanced,4.312602678934733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.01,2.209516716003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,1.0917375564575196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.01,2.7378496170043944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,balanced,0.9526080290476481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,1.257369613647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.01,3.2073535919189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,1.2938752174377441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,balanced,0.9805333614349365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.01,4.163462448120117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,1.6003711700439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.01,5.993209457397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,1.9016895294189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,2.555129623413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.01,8.102310180664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,balanced,5.369653065999349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,3.235647964477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.01,9.857369232177735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,balanced,10.669349670410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,4.53960952758789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.01,12.241535949707032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,6.00561294555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,balanced,1.0581759611765544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.01,18.300218200683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.01,7.496422576904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,balanced,1.1737546920776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,balanced,1.268623987833659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.01,11.269951629638673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,balanced,1.4973972638448079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,power_law_1.01,0.10408320426940917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.01,34.98310546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,balanced,6.920186360677083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,power_law_1.01,0.11549439430236816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,balanced,1.6870613098144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.01,23.938943481445314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,power_law_1.01,0.1976256012916565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,power_law_1.01,0.30303359031677246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,balanced,2.43777068456014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,power_law_1.01,0.3978816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,power_law_1.01,0.6493887901306152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,balanced,2.8293654123942056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,power_law_1.01,0.716428804397583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,balanced,17.90619150797526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,power_law_1.01,0.7645055770874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,power_law_1.01,0.7864895820617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,balanced,4.264058748881022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,power_law_1.01,0.8329407691955566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,power_law_1.01,0.8479616165161132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.12234879732131958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,power_law_1.01,0.8971648216247559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,power_law_1.01,0.9493503570556641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.1460543990135193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,balanced,11.562629699707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,balanced,5.7109120686848955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.28822400569915774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,power_law_1.01,1.0062399864196778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.41685757637023924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.6274687767028808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,power_law_1.01,0.9935423851013183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,1,power_law_1.2,1.304793643951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,1,power_law_1.2,1.347871971130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,power_law_1.01,1.0343168258666993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,1,power_law_1.2,1.4087488174438476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,balanced,8.738565444946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,1,power_law_1.2,1.4545408248901368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,power_law_1.01,1.067084789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,1,power_law_1.2,1.5044672012329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,power_law_1.01,1.2627200126647948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,1,power_law_1.2,1.5728192329406738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,1,power_law_1.2,1.6375999450683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.01,1.4411711692810059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,1,power_law_1.2,1.6953727722167968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.01,1.641561508178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,1,power_law_1.2,1.6753280639648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.01,1.9541248321533202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,1,power_law_1.2,1.7401216506958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.01,2.6036415100097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,balanced,11.792133331298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.01,3.274118423461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,1,power_law_1.2,1.7968191146850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.01,4.653555297851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,1,power_law_1.2,1.8514368057250976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.01,6.004576110839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,1,power_law_1.2,2.0201663970947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.01,8.766175842285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,1,power_law_1.2,1.9534847259521484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.07912319898605347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.01,11.633382415771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.08892160058021545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,1,power_law_1.2,2.1756160736083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,balanced,34.02142333984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.16517759561538697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,1,power_law_1.2,2.3704383850097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.01,14.451385498046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,1,power_law_1.2,0.2439296007156372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,balanced,14.828736623128256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,1,power_law_1.2,2.8470272064208983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,1,power_law_1.2,0.3208767890930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,1,power_law_1.2,3.364672088623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,1,power_law_1.2,0.6845503807067871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,power_law_1.01,23.974969482421876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,1,power_law_1.2,0.7151487827301025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,1,power_law_1.2,4.3612926483154295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,balanced,22.782676696777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,1,power_law_1.2,0.7629439830780029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,1,power_law_1.2,5.84705924987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,1,power_law_1.2,0.7934720039367675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,power_law_1.01,49.40886535644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,1,power_law_1.2,7.903794860839843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,1,power_law_1.2,0.8015872001647949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,1,power_law_1.2,0.8109696388244629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,1,power_law_1.2,10.071392059326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,1,power_law_1.2,0.8567808151245118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,1,power_law_1.2,0.8702527999877929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,1,power_law_1.2,12.31817626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,1,power_law_1.2,0.9193023681640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,1,power_law_1.2,0.9546688079833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,1,power_law_1.2,17.659500122070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,balanced,24.495887756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,1,power_law_1.2,0.9972224235534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,1,power_law_1.2,0.9655039787292481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,1,power_law_1.2,1.0675840377807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,1,power_law_1.2,34.4216064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,1.1263487815856934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,1.2835968017578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,1.3432703971862794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,1.6524543762207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,1.9618303298950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,2.632275199890137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,3.2721790313720702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,4.611308670043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,6.182515335083008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,1,power_law_1.2,7.647007751464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,1,power_law_1.2,11.039615631103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,1,power_law_1.2,0.1028607964515686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,1,power_law_1.2,23.55523223876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,1,power_law_1.2,0.11278719902038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,1,power_law_1.2,0.1737280011177063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,1,power_law_1.2,0.24461441040039061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,1,power_law_1.2,0.34967041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,1,power_law_1.2,0.6904895782470704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,1,power_law_1.2,0.7372288227081298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,1,power_law_1.2,0.784287977218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,balanced,51.502176920572914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,balanced,0.32208534081776935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,1,power_law_1.2,0.7992576122283935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,1,power_law_1.2,0.8377408027648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,balanced,0.5271733204523722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,1,power_law_1.2,0.8734463691711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,balanced,1.001802682876587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,1,power_law_1.2,0.9161279678344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,balanced,1.961967945098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,1,power_law_1.2,0.9630399703979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,balanced,3.9254185358683267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,1,power_law_1.2,1.0330495834350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,balanced,4.858928044637044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,balanced,4.871786753336589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,1,power_law_1.2,1.020742416381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,balanced,4.921530723571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,1,power_law_1.2,1.0669952392578126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,balanced,4.935306549072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,balanced,4.956170717875163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,1,power_law_1.2,1.09933443069458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,balanced,4.916005452473958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,1,power_law_1.2,1.2702719688415527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.2,1.455072021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,balanced,4.933072090148926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.2,1.6852544784545898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,balanced,4.945349375406901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.2,1.9938304901123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,balanced,4.986010551452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.2,2.6396352767944338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,balanced,5.0127518971761065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.2,3.3357822418212892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,balanced,5.164671897888184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.2,4.692800140380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,balanced,5.295962651570638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.2,6.057900619506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,balanced,5.422746658325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.2,8.784921264648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.2,11.653196716308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,balanced,5.474559783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.2,14.388140869140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,balanced,6.919141133626302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,balanced,6.058826446533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,1,power_law_1.2,23.367161560058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,balanced,0.18684800465901694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,balanced,0.29417600234349567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,balanced,11.891663869222006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,balanced,0.5433386564254761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,balanced,1.047221342722575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,1,power_law_1.2,47.83838806152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,balanced,6.681018829345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,balanced,2.0654613176981607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,balanced,2.562719980875651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,balanced,2.5764427185058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,balanced,2.59061861038208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,balanced,12.072954813639322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,balanced,2.597760041554769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,balanced,2.6028854052225747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,balanced,2.6311519940694175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,balanced,2.628330707550049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,balanced,11.55289077758789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,balanced,0.20661866664886475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,balanced,2.668858528137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,balanced,0.3015893300374349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,balanced,2.6813281377156577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.2843839883804321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,balanced,0.5419626633326212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.4610176086425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,balanced,2.718421300252279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,balanced,1.0193119843800862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.70415358543396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,balanced,2.7471841176350913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,balanced,1.9643093744913738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.01,1.414527988433838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,balanced,2.452218691507975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,balanced,2.8096745808919272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,balanced,18.05606969197591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.01,1.9952512741088868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,balanced,2.466757297515869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,balanced,2.8573118845621743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.01,3.6530494689941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,balanced,2.4840052922566733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,balanced,2.499882698059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,balanced,2.959925333658854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.01,3.802899169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.17226239442825317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,balanced,2.5137279828389487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.01,4.001478576660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,balanced,3.969440142313639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,balanced,2.536191940307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.01,4.1852672576904295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.01,0.266592001914978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,balanced,2.56496000289917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.01,0.38309760093688966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.01,4.266022491455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,balanced,3.264277458190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.01,0.6974207878112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,balanced,2.5897812843322754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.01,4.3552192687988285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.01,1.0129280090332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,balanced,34.82804870605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.01,4.5083263397216795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,balanced,5.7324479420979815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.01,1.786515235900879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,balanced,2.641285260518392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.01,2.0100992202758787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.01,4.5920768737792965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.01,2.0614208221435546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.01,4.789113616943359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,balanced,2.7027413050333657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,balanced,3.8269707361857095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.01,2.124287986755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.01,5.176275253295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.01,2.2222272872924806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.01,5.404051208496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.01,2.313920021057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.01,5.269209671020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,balanced,6.399824142456055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.01,2.3344255447387696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,balanced,2.7574081420898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.01,5.846451187133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.01,2.394764709472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.01,2.401523208618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.01,7.075244903564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.01,2.517919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,balanced,39.16739145914713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.01,2.636537551879883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.01,8.885298919677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,balanced,6.955221176147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.01,2.6990400314331056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.01,2.9565439224243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.01,8.777247619628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,balanced,2.8607041041056314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,3.225177764892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.01,11.305484771728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,3.6396865844726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,4.108569717407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.01,9.301811218261719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,5.011833572387696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,balanced,10.389045079549154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.01,11.428639984130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,4.867967987060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.2843839883804321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,power_law_1.01,0.20016000270843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,6.0759937286376955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.01,13.345004272460937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.3613248109817505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,power_law_1.01,0.30531840324401854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.671449613571167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,7.242495727539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,power_law_1.01,0.39758079051971434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,balanced,3.0715039571126304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,1,power_law_1.2,1.216044807434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.01,17.599110412597657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,power_law_1.01,0.711078405380249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,1,power_law_1.2,1.7758272171020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,9.63017578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,power_law_1.01,1.074777603149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,balanced,3.2483625411987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,power_law_1.01,1.8140735626220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,1,power_law_1.2,3.5105857849121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.01,33.159942626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,power_law_1.01,2.011494445800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,balanced,3.6049013137817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,1,power_law_1.2,3.848953628540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,13.669247436523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,balanced,12.712362925211588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,power_law_1.01,2.14007682800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,1,power_law_1.2,4.150291061401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,balanced,65.53537495930989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,power_law_1.01,2.192870330810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,balanced,3.9532480239868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.01,16.653074645996092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,1,power_law_1.2,4.40716781616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,power_law_1.01,2.286636734008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.01,39.92741088867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,1,power_law_1.2,4.398566436767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,power_law_1.01,2.4230783462524412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,power_law_1.01,2.6602048873901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,1,power_law_1.2,4.533203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,balanced,5.885861078898112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.01,25.70972900390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,power_law_1.01,2.773734474182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,1,power_law_1.2,4.744243240356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,power_law_1.01,3.046739196777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,1,power_law_1.2,4.904870223999024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,power_law_1.01,3.377862548828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,balanced,6.901466369628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.01,61.51474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,1,power_law_1.2,5.035654449462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.01,41.2304443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,1,power_law_1.2,5.363014221191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,balanced,14.518421173095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,power_law_1.01,3.112691116333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,1,power_law_1.2,5.4917247772216795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,balanced,10.782821655273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,1,power_law_1.2,5.48455696105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,power_law_1.01,3.421491241455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.01,71.18472290039062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,1,power_law_1.2,6.071110534667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,1,power_law_1.2,7.316172790527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,power_law_1.01,3.429548645019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,1,power_law_1.2,8.959238433837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,balanced,15.318864186604818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.01,3.8875328063964845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.01,3.9902976989746093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,1,power_law_1.2,9.001074981689452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.01,4.693772888183593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,1,power_law_1.2,11.318227386474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.01,6.148460769653321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,1,power_law_1.2,9.640518188476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.01,7.648384094238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,1,power_law_1.2,11.600704193115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,balanced,22.086331685384113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,balanced,26.274709065755207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.01,11.020070648193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,1,power_law_1.2,13.763699340820313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.17450239658355712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.01,14.553535461425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,1,power_law_1.2,0.18154879808425903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,1,power_law_1.2,18.218150329589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,1,power_law_1.2,0.375052809715271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,1,power_law_1.2,0.5937471866607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.01,21.982392883300783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,1,power_law_1.2,0.9045568466186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,1,power_law_1.2,30.212997436523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,balanced,67.73475646972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,1,power_law_1.2,1.8429695129394532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.01,29.7135498046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,1,power_law_1.2,2.08538875579834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,balanced,31.893643697102863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,1,power_law_1.2,36.877996826171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,1,power_law_1.2,2.109542465209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,1,power_law_1.2,2.2390975952148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.01,37.25804138183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,1,power_law_1.2,2.2176191329956056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,1,power_law_1.2,53.53785400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,1,power_law_1.2,2.356332778930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,1,power_law_1.2,2.4296255111694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,1,power_law_1.2,2.4720575332641603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,power_law_1.01,60.95762329101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,1,power_law_1.2,2.5480064392089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,1,power_law_1.2,2.593356704711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,balanced,38.753936767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,1,power_law_1.2,2.731078338623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,1,power_law_1.2,70.4941650390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,1,power_law_1.2,2.8402624130249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,1,power_law_1.2,3.1261247634887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,3.2703487396240236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,3.8326465606689455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,power_law_1.01,125.58099365234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,4.166291046142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,5.110348892211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,balanced,43.44586181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,5.000576019287109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,6.165139389038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,7.420076751708985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,9.686892700195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,balanced,65.6743672688802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,13.449049377441407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,1,power_law_1.2,16.622918701171876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,1,power_law_1.2,24.8176513671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,1,power_law_1.2,41.41630859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,balanced,0.3081013361612956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,balanced,0.4891466697057088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,1,power_law_1.2,0.20108799934387206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,balanced,0.9370666344960531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,1,power_law_1.2,0.20894720554351806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,balanced,1.8626453081766765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,1,power_law_1.2,0.3885567903518677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,balanced,3.675845464070638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,1,power_law_1.2,0.6194496154785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,1,power_law_1.2,0.8818240165710449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,balanced,7.297920227050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,1,power_law_1.2,1.759667205810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,balanced,10.893077850341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,1,power_law_1.2,2.029248046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,balanced,138.65823364257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,1,power_law_1.2,2.097804832458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,balanced,10.913973490397135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,1,power_law_1.2,2.1703296661376954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,balanced,10.92300796508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,1,power_law_1.2,2.3367551803588866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,balanced,10.942432403564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,1,power_law_1.2,2.5120384216308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,balanced,10.933216094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,1,power_law_1.2,2.7047679901123045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,1,power_law_1.2,2.868921661376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,balanced,11.016000111897787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,1,power_law_1.2,3.1676095962524413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,balanced,11.062479654947916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,1,power_law_1.2,3.3558017730712892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,balanced,10.913200378417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,balanced,10.956053415934244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,1,power_law_1.2,3.1374208450317385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,balanced,11.008293151855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,balanced,10.966475168863932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,1,power_law_1.2,3.401337432861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,balanced,0.17841599384943643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,balanced,0.2723360061645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,balanced,11.107418060302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,balanced,0.49963200092315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,1,power_law_1.2,3.48076171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,balanced,0.9586026668548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,balanced,11.594757080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,balanced,1.8705546061197917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.2,3.9199295043945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,balanced,3.6919733683268228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.2,4.1173759460449215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,balanced,12.004895528157553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.2,4.770150375366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,balanced,5.545162836710612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.2,6.167808151245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,balanced,5.532079696655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,balanced,12.359573364257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.2,7.699231719970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,balanced,5.543962478637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,balanced,5.634208043416341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.2,10.771711730957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,balanced,13.018399556477865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,balanced,5.616517384847005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.2,14.01898193359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,balanced,5.630645116170247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,balanced,5.649530410766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,balanced,13.434623718261719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.2,20.796319580078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,balanced,5.663349151611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,balanced,5.734202702840169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.2,28.030291748046874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.26591360569000244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,balanced,5.775562922159831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,balanced,14.182239532470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.48911361694335936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,balanced,5.800522486368815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.9331328392028808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.2,35.39322204589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,balanced,0.24358399709065756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.01,1.2940223693847657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,balanced,5.981797536214192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,balanced,0.3211466670036316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.01,2.646342468261719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.1792512059211731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,balanced,6.058970769246419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,balanced,14.643845876057943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,balanced,0.5322879950205485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.01,4.120102310180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,balanced,0.9782719612121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.01,0.27733759880065917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,1,power_law_1.2,58.307989501953124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,balanced,6.315680185953776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,balanced,1.8623520533243816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.01,4.900543975830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.01,0.5107327938079834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,balanced,3.6275466283162436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.01,6.649619293212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,balanced,6.458799997965495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.01,0.6525248050689697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,balanced,5.391690572102864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.01,1.3752256393432618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.01,7.113414764404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,balanced,5.40882682800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,balanced,15.947893778483072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,balanced,6.83568000793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.01,2.138540840148926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,balanced,5.429808298746745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.01,7.212665557861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.01,2.621433639526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,balanced,5.442277272542317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.01,7.66144027709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.01,3.4826496124267576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,balanced,7.154970804850261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,balanced,5.471893310546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,1,power_law_1.2,119.3363525390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.01,7.948902130126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,balanced,5.506170908610026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.01,3.6495742797851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.01,7.901958465576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,balanced,5.5382506052653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.01,3.80120964050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,balanced,7.818101247151692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,balanced,5.603504180908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.01,8.387071990966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.01,3.9734142303466795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,balanced,26.516382853190105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,balanced,5.67305056254069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.01,4.180704116821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.01,8.480723571777343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,balanced,5.724165598551433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.01,4.377017593383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.01,8.826092529296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,power_law_1.01,0.25416319370269774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,balanced,5.843690872192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,balanced,8.408666610717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.01,4.758809661865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.01,9.258956909179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,power_law_1.01,0.3578687906265259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,balanced,6.078927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.01,5.051417541503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.01,9.826361846923827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,power_law_1.01,0.5776383876800537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.01,5.441632080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,power_law_1.01,0.690009593963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.01,12.898104858398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.01,5.046988677978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,power_law_1.01,1.3680447578430175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,power_law_1.01,2.0372800827026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,balanced,9.77026112874349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.01,5.441305541992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.01,15.659500122070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,balanced,6.296794891357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,power_law_1.01,2.5106176376342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,balanced,45.6416982014974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,6.601657867431641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,power_law_1.01,3.3568382263183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.01,15.548883056640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,7.891916656494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,power_law_1.01,3.596486282348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,power_law_1.01,3.7117504119873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,7.275878143310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.01,20.032345581054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,power_law_1.01,3.859385681152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,9.078675079345704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,power_law_1.01,4.107372665405274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.01,16.022866821289064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,power_law_1.01,4.330054473876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,balanced,12.507476806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,balanced,6.765439987182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,7.449113464355468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,power_law_1.01,4.604473495483399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.01,19.831590270996095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,8.543981170654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,balanced,7.157503763834636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,power_law_1.01,5.01011848449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.01,18.504293823242186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,10.263155364990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,power_law_1.01,5.293254470825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,balanced,7.885904312133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,power_law_1.01,5.911552047729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,12.966470336914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.01,22.860806274414063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,power_law_1.01,7.2079612731933596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,balanced,8.73639996846517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,15.835250854492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,balanced,39.82033030192057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.01,39.38359680175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.01,7.004390716552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,balanced,18.14473597208659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.01,19.17164764404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,balanced,10.271727879842123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.2661312103271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.01,6.960832214355468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.01,45.09480285644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.01,26.48729553222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.6337664127349854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.01,8.01488037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,1,power_law_1.2,1.2252415657043456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,1,power_law_1.2,2.2674943923950197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,balanced,16.829493204752605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.01,10.054163360595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,1,power_law_1.2,3.444723129272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.01,46.37894287109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.01,47.355859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,1,power_law_1.2,4.148704147338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.01,9.672383880615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,1,power_law_1.2,6.424896240234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.01,13.002188110351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,1,power_law_1.2,6.683251190185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,1,power_law_1.2,7.075827026367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,balanced,20.27977116902669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.01,16.40723876953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,1,power_law_1.2,7.373772430419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,balanced,22.291590372721355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,1,power_law_1.2,7.718739318847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.01,23.603981018066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.01,118.7379150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,1,power_law_1.2,8.16792984008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,1,power_law_1.2,8.46060791015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.01,30.687725830078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,1,power_law_1.2,8.650214385986327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,1,power_law_1.2,8.955974578857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,balanced,29.807729085286457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,1,power_law_1.2,9.321900939941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.01,38.45168762207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,1,power_law_1.2,10.432038116455079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,1,power_law_1.2,12.961030578613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,1,power_law_1.2,15.78775634765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,balanced,78.58030192057292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,power_law_1.01,61.407196044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,1,power_law_1.2,16.40662384033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,1,power_law_1.2,20.70569610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,balanced,40.096832275390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,1,power_law_1.2,16.1727294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,1,power_law_1.2,19.822329711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,power_law_1.01,126.2141845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,1,power_law_1.2,19.789830017089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,1,power_law_1.2,23.562643432617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,balanced,47.12114969889323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,1,power_law_1.2,38.89432983398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.17763199806213378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,1,power_law_1.2,0.2698368072509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,balanced,62.9608154296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,1,power_law_1.2,43.657049560546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,1,power_law_1.2,0.33838720321655275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,1,power_law_1.2,0.6666687965393067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,1,power_law_1.2,1.0965312004089356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,1,power_law_1.2,44.70652770996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,1,power_law_1.2,1.7774911880493165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,1,power_law_1.2,2.1559680938720702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,1,power_law_1.2,3.243660736083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,1,power_law_1.2,3.450649642944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,1,power_law_1.2,3.543507385253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,1,power_law_1.2,103.58914794921876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,1,power_law_1.2,3.717753601074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,1,power_law_1.2,3.9775489807128905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,1,power_law_1.2,4.124211120605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,1,power_law_1.2,4.647513580322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,1,power_law_1.2,5.019737625122071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,1,power_law_1.2,5.335110473632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,1,power_law_1.2,5.074745559692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,1,power_law_1.2,5.699827194213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,6.986700439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,7.970073699951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,7.626630401611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,9.56833267211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,7.842726135253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,balanced,131.2564697265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,9.279743957519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,10.584397125244141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,12.958502197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,1,power_law_1.2,0.25276799201965333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,18.203782653808595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,1,power_law_1.2,0.36499838829040526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,1,power_law_1.2,0.42580480575561525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,1,power_law_1.2,20.95836181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,1,power_law_1.2,0.7170623779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,1,power_law_1.2,1.2273344039916991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,1,power_law_1.2,25.281138610839843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,1,power_law_1.2,1.7985984802246093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,1,power_law_1.2,2.271808052062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,1,power_law_1.2,3.294841766357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,1,power_law_1.2,49.980856323242186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,1,power_law_1.2,3.487315368652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,1,power_law_1.2,3.4497215270996096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,1,power_law_1.2,4.000102233886719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,1,power_law_1.2,4.154252624511718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,1,power_law_1.2,4.345305633544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,1,power_law_1.2,4.757376098632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,1,power_law_1.2,5.149580764770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,1,power_law_1.2,5.49183349609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,balanced,0.10452266534169515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,power_law_1.2,0.10212479829788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,1,power_law_1.01,0.10207359790802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,1,power_law_1.2,6.136486434936524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,1,power_law_1.2,7.241011047363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.2,7.080147552490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,balanced,0.13125866651535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,power_law_1.01,0.1299456000328064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,1,power_law_1.2,0.12956160306930542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.2,7.420671844482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,balanced,0.10214933753013611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.2,8.38745574951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,power_law_1.01,0.09896320104598999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,power_law_1.01,0.14781440496444703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,balanced,0.1929546594619751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,1,power_law_1.2,0.1444607973098755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.2,10.469971466064454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,balanced,0.13061867157618204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,power_law_1.01,0.11733759641647339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.2,10.178630065917968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,balanced,0.2160053253173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,power_law_1.01,0.1863808035850525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,1,power_law_1.2,0.17616000175476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,balanced,0.18552533785502115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.2,12.943807983398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,power_law_1.01,0.15300480127334595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.2,15.95098876953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,balanced,0.2143519918123881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,power_law_1.01,0.12617599964141846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.2,21.330221557617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,balanced,0.3275360067685445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,power_law_1.01,0.23797760009765626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,1,power_law_1.2,0.20409600734710692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.2,29.086004638671874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,balanced,0.18894400199254355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,power_law_1.2,0.2740864038467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,power_law_1.01,0.2906496047973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,1,balanced,0.6123786767323812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,power_law_1.01,0.18152320384979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,balanced,0.19084266821543375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,power_law_1.01,0.18520959615707397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.2,36.39726867675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,balanced,0.1913813352584839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,power_law_1.01,0.18818559646606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,power_law_1.01,0.20505599975585936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,balanced,0.191103994846344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,balanced,0.6152106523513794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,power_law_1.01,0.42693119049072265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,1,power_law_1.2,0.42709760665893554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,power_law_1.01,0.21322879791259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,balanced,0.6162399848302206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,balanced,0.19218667348225912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,power_law_1.01,0.46465277671813965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,1,power_law_1.2,0.4476607799530029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,1,power_law_1.2,59.00490112304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,1,power_law_1.2,0.10007679462432861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,power_law_1.01,0.2350912094116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,balanced,0.19324266910552979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,1,power_law_1.2,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,1,power_law_1.2,0.13100160360336305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,power_law_1.01,0.26584959030151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,balanced,0.19356799125671387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,1,power_law_1.2,0.11793919801712036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,balanced,0.6179146766662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,power_law_1.01,0.4689792156219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,1,power_law_1.2,0.4763199806213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,1,power_law_1.2,0.18055039644241333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,balanced,0.6223253409067789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,power_law_1.01,0.49354238510131837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,1,power_law_1.2,0.18398720026016235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,1,power_law_1.2,0.48339200019836426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,1,power_law_1.2,0.19857280254364013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,1,power_law_1.2,0.20745599269866943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,1,power_law_1.2,0.2188096046447754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,balanced,0.15135467052459717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,balanced,0.20667733748753866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,balanced,0.6238346497217814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,1,power_law_1.2,0.23416318893432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,power_law_1.01,0.2465536117553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,1,power_law_1.2,124.16849365234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,power_law_1.2,0.5329535961151123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,balanced,0.2574293414751689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,1,power_law_1.01,0.5206975936889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,1,power_law_1.2,0.2611776113510132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,1,power_law_1.2,0.25615360736846926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,balanced,0.4773600101470947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,power_law_1.01,0.27525761127471926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,power_law_1.2,0.27714560031890867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,1,balanced,0.2076479991277059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,balanced,0.483791987101237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,balanced,0.6271040042241415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,balanced,0.4827359914779663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,power_law_1.2,0.5453760147094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,1,power_law_1.01,0.5362624168395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,power_law_1.01,0.3065023899078369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,balanced,0.20970666408538818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,1,power_law_1.2,0.3075648069381714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,balanced,0.4835413297017415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,balanced,0.48559999465942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,balanced,0.48880000909169513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,balanced,0.6293173233668009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,balanced,0.5039093494415283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,power_law_1.2,0.5906112194061279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,1,power_law_1.01,0.5579584121704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,balanced,0.5053120056788126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,balanced,0.5110506614049276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,power_law_1.2,0.3542975902557373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,power_law_1.01,0.3548352003097534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,1,balanced,0.26121066013971966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,balanced,0.6359573205312093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,balanced,0.5132693449656168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,power_law_1.2,0.666476821899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,balanced,0.5143200159072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,1,power_law_1.01,0.6229119777679444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,power_law_1.2,0.3744704008102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,power_law_1.01,0.3716415882110596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,1,balanced,0.2621333400408427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,balanced,0.5510559876759847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,balanced,0.5518186489741007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,balanced,0.6427306731541952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,balanced,0.5541119972864786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,power_law_1.2,0.7248576164245606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,power_law_1.2,0.44167680740356446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,power_law_1.01,0.41313920021057127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,1,balanced,0.26600533723831177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,balanced,0.5727253357569376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,1,power_law_1.01,0.6820032119750976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,balanced,0.6088800032933553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,balanced,0.5396480162938436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,power_law_1.2,0.7739327907562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,1,power_law_1.01,0.7805952072143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,balanced,0.635968009630839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,balanced,0.647050658861796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,power_law_1.2,0.7975808143615722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,balanced,0.8556000391642252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,1,power_law_1.01,0.7499072074890136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,power_law_1.2,0.9263872146606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,power_law_1.01,0.8938048362731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,1,balanced,0.5463306506474813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,balanced,0.9635413487752279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,balanced,1.3851626714070637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,balanced,0.6562773386637369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,power_law_1.2,0.9352383613586426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,power_law_1.2,1.1482368469238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,balanced,1.025055964787801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,1,power_law_1.01,1.1244799613952636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,balanced,1.8121546109517415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,1,power_law_1.01,0.895359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,power_law_1.2,1.3590592384338378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,balanced,1.0347039699554443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,1,power_law_1.01,1.3678272247314454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,balanced,2.67740790049235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,power_law_1.2,1.860620880126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,balanced,3.6222187678019204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,power_law_1.01,1.8692800521850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,1,balanced,1.5295039812723796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,balanced,0.706442674001058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,power_law_1.2,0.9702912330627441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,1,power_law_1.01,0.910860824584961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,power_law_1.2,2.3548864364624023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,power_law_1.01,2.348582458496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,balanced,5.74729601542155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,1,balanced,2.0393013954162598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,power_law_1.2,1.13505277633667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,balanced,0.7156426906585693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,power_law_1.2,3.3631553649902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,power_law_1.01,3.3281856536865235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,1,balanced,3.002922693888346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,1,power_law_1.01,1.0943679809570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,balanced,7.768304189046224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,power_law_1.2,4.297983932495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,power_law_1.01,4.281606292724609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,1,balanced,3.9757439295450845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,balanced,9.879685084025065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,power_law_1.2,6.192742538452149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,power_law_1.01,6.204345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,1,balanced,5.915946960449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,power_law_1.2,1.4384896278381347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,power_law_1.01,1.3331904411315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,1,balanced,0.9492853482564291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,power_law_1.01,8.18896026611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,power_law_1.2,8.1587646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,balanced,16.69607416788737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,1,balanced,7.883951822916667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,power_law_1.2,1.633184051513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,power_law_1.01,1.5190208435058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,power_law_1.2,10.052857971191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,power_law_1.01,10.137490844726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,1,balanced,0.9643306732177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,power_law_1.2,3.0742656707763674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,power_law_1.2,15.939961242675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,power_law_1.01,15.924826049804688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,power_law_1.01,2.920876884460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,1,balanced,2.0118932723999023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,1,balanced,9.821322758992514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,balanced,30.353599548339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,power_law_1.2,32.05528869628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,power_law_1.01,31.833221435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,power_law_1.2,3.57891845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,power_law_1.01,3.4671424865722655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,balanced,0.09870933492978413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,1,balanced,2.050442695617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,balanced,0.15078399578730264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,power_law_1.2,4.611808013916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,balanced,0.2696160078048706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,balanced,3.9171787897745767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,1,power_law_1.01,4.382976150512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,1,balanced,15.660394032796225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,balanced,0.2720426718393962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,balanced,0.2717493375142415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,balanced,0.275221327940623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,power_law_1.2,5.486675262451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,balanced,0.2770933310190837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,power_law_1.01,5.358835220336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,1,balanced,4.018944104512532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,balanced,0.278714656829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,balanced,0.2789226571718852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,balanced,0.28411199649175006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,balanced,0.2834826707839966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,power_law_1.2,7.532025909423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,power_law_1.01,7.3040000915527346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,balanced,0.2862666646639506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,1,balanced,5.937589645385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,balanced,0.2901386618614197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,balanced,0.2951146761576335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,balanced,0.31225067377090454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,power_law_1.2,9.30478744506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,power_law_1.01,9.134521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,1,balanced,7.963621139526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,balanced,0.31506667534510296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,balanced,0.3340959946314494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,1,balanced,31.73785146077474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,balanced,0.3858826557795207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,balanced,0.38971734046936035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,power_law_1.2,11.312351989746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,power_law_1.01,11.069369506835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,balanced,0.5227359930674235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,1,balanced,9.851055781046549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,balanced,0.5955679814020792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,balanced,0.8471733729044596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,power_law_1.2,17.306585693359374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,power_law_1.01,16.954713439941408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,balanced,1.1249279975891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,balanced,1.6415200233459473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,power_law_1.2,33.038937377929685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,power_law_1.01,32.97676086425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,1,balanced,15.585653940836588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,balanced,2.5003840128580728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,balanced,3.7437171936035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,balanced,4.135178565979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,balanced,5.184853235880534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,balanced,9.298432032267252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,1,balanced,31.83233642578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,balanced,19.353722890218098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.14897279739379882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.01,0.18910720348358154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.16316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.01,0.21006720066070556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.15104639530181885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.01,0.32274560928344725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.26439039707183837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.01,0.47918081283569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.01,0.2648063898086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.01,0.4806848049163818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.01,0.27393920421600343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.01,0.4933504104614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.01,0.2781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.01,0.5508800029754639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.01,0.28336639404296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,balanced,0.08805333574612935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.01,0.5669248104095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.01,0.6293824195861817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.01,0.2999232053756714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,balanced,0.14331733187039694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.01,0.6683775901794433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.01,0.30405120849609374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,balanced,0.2511199911435445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.01,0.5508351802825928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.01,0.29180159568786623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,balanced,0.25571733713150024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.01,0.6005055904388428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.01,0.31175038814544676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,balanced,0.25775466362635296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.01,0.31637120246887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.01,0.5755263805389405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,balanced,0.262442668279012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.01,0.37077760696411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.01,0.6238656044006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,balanced,0.2650559941927592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.01,0.40381441116333006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.01,0.6700352191925049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,balanced,0.2669653296470642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.01,0.4993599891662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.01,0.6822527885437012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.01,0.38232319355010985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.01,0.6973055839538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.01,0.4911231994628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.01,0.8830911636352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,0.6177152156829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.01,1.0196415901184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,0.9299712181091309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.01,1.5480704307556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,balanced,0.26983465751012164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,0.9880000114440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.01,1.787923240661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,1.1804224014282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,balanced,0.2733866572380066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.01,2.263398361206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,1.8811712265014648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,2.6472768783569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.01,3.112454414367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,power_law_1.01,0.14168319702148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,3.702489471435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.01,4.767686462402343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,power_law_1.01,0.1546175956726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,6.624082946777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,power_law_1.01,0.13190399408340453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.01,6.3941505432128904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,power_law_1.01,0.24588160514831542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,6.474976348876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.01,9.569017791748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,balanced,0.28150399525960285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,power_law_1.01,0.25824000835418703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.01,7.007622528076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,power_law_1.01,0.2828736066818237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,balanced,0.28620266914367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.01,14.618643188476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,power_law_1.01,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,balanced,0.29293866952260333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.01,14.701632690429687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,power_law_1.01,0.3129535913467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,balanced,0.3001546661059062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.01,14.695712280273437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,balanced,0.31994666655858356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.01,25.705831909179686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,balanced,0.32734400033950806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,power_law_1.01,0.3177792072296143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.01,27.55572509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,balanced,0.3429119984308879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,power_law_1.01,0.31400959491729735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,balanced,0.47763200600941974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.23606400489807128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.14929280281066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,balanced,0.5151626666386923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,2,power_law_1.2,0.2581376075744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,balanced,0.7531039714813232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,power_law_1.01,0.3181823968887329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.01,46.586328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,2,power_law_1.2,0.29760639667510985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.16239360570907593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,balanced,1.0107999642690022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,power_law_1.01,0.34028160572052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,2,power_law_1.2,0.4796480178833008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,2,power_law_1.2,0.25458559989929197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,power_law_1.01,0.34586880207061765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,2,power_law_1.2,0.4810880184173584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,2,power_law_1.2,0.26458239555358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,balanced,1.5194080670674641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,power_law_1.01,0.4060224056243896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,2,power_law_1.2,0.4965504169464111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,2,power_law_1.2,0.2771392107009888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,balanced,2.0322559674580893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,2,power_law_1.2,0.29027841091156004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,power_law_1.01,0.40836482048034667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,2,power_law_1.2,0.5026495933532715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,power_law_1.01,0.4432384014129639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,2,power_law_1.2,0.2819391965866089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,2,power_law_1.2,0.5986048221588135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,balanced,3.0390345255533853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,power_law_1.01,0.4719423770904541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,2,power_law_1.2,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,2,power_law_1.2,0.3090816020965576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,2,power_law_1.2,0.5933568000793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,power_law_1.01,0.6993919849395752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,2,power_law_1.2,0.2911616086959839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,2,power_law_1.2,0.14384640455245973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,balanced,4.032191912333171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,2,power_law_1.2,0.6894656181335449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.01,0.858681583404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,2,power_law_1.2,0.3006079912185669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,2,power_law_1.2,0.1668992042541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,2,power_law_1.2,0.5529856204986572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.01,1.1549887657165527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,2,power_law_1.2,0.3086911916732788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,2,power_law_1.2,0.25594239234924315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,2,power_law_1.2,0.571392011642456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.01,1.7394048690795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,balanced,6.102671941121419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,2,power_law_1.2,0.34291839599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,2,power_law_1.2,0.25841920375823973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,2,power_law_1.2,0.5774784088134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.01,2.5901695251464845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,2,power_law_1.2,0.3818687915802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,2,power_law_1.2,0.28458240032196047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,2,power_law_1.2,0.6200255870819091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,2,power_law_1.2,0.44658560752868653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,2,power_law_1.2,0.3011775970458984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.01,3.5911487579345702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,balanced,8.164506912231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,2,power_law_1.2,0.6861631870269775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,2,power_law_1.2,0.3143232107162476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,2,power_law_1.2,0.4659711837768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.01,4.238028717041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,2,power_law_1.2,0.6935167789459229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,2,power_law_1.2,0.4294911861419678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,2,power_law_1.2,0.7141632080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.01,7.000627136230468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,2,power_law_1.2,0.5178815841674804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,2,power_law_1.2,0.306278395652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,2,power_law_1.2,0.8414463996887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,0.6656960010528564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,balanced,10.331621170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.01,10.31115493774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,2,power_law_1.2,0.3175487995147705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,0.8058815956115722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,2,power_law_1.2,1.0920319557189941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,balanced,0.1532960037390391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,1.0695808410644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,2,power_law_1.2,1.3764543533325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.01,15.615776062011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,balanced,0.25276267528533936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,2,power_law_1.2,0.3253247976303101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,1.4639424324035644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,2,power_law_1.2,1.8322816848754884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,balanced,0.48608001073201496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,2,power_law_1.2,0.32753279209136965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,power_law_1.01,18.818482971191408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,balanced,0.49008532365163165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,1.8473344802856446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,2,power_law_1.2,2.660966491699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,balanced,0.4912000099817912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,balanced,17.53222401936849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,2,power_law_1.2,0.3576575994491577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,2.712486457824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,balanced,0.49459731578826904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,2,power_law_1.2,3.3533824920654296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,2,power_law_1.2,0.386028790473938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,balanced,0.4960639874140422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,4.231116867065429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,power_law_1.01,31.77464904785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,balanced,0.5129493474960327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,2,power_law_1.2,0.3980288028717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,2,power_law_1.2,5.545542526245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,balanced,0.5094453493754069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,5.3517505645751955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,2,power_law_1.2,0.4312895774841309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,balanced,0.5161973237991333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,2,power_law_1.2,0.5024191856384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,balanced,0.5225866635640463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,2,power_law_1.2,7.065087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,6.726022338867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,2,power_law_1.2,0.7499072074890136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,balanced,0.5220853487650553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,balanced,0.5256533225377401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.2,0.9010496139526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,power_law_1.01,63.0986572265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,2,power_law_1.2,9.56732177734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,2,power_law_1.2,10.167110443115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,balanced,0.5600373347600301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.2,1.4961024284362794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,balanced,0.5773173173268636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.2,1.6695615768432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,balanced,0.575488011042277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,2,power_law_1.2,16.887628173828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,2,power_law_1.2,13.952569580078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,balanced,40.69892374674479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.2,2.33941764831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,balanced,0.6001439889272054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,balanced,0.6226933399836222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.2,3.328403091430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,2,power_law_1.2,17.858540344238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,2,power_law_1.2,25.131205749511718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,balanced,0.6554400126139323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.2,4.7007488250732425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,balanced,0.8471306959788004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,balanced,1.0094986756642659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.2,5.348543930053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,balanced,1.4477386474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,2,power_law_1.2,30.773138427734374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.2,9.781817626953124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,balanced,1.9126826922098796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,balanced,2.81223996480306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.2,13.150086975097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,balanced,3.7748425801595054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,2,power_law_1.2,58.872772216796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,2,power_law_1.2,17.55926971435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,balanced,6.371189117431641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,2,power_law_1.2,31.546572875976562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,balanced,8.132832209269205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,balanced,9.91592534383138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,2,power_law_1.2,77.5755126953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,balanced,15.668490091959635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,balanced,0.08984532952308655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,balanced,0.14545599619547525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,balanced,0.25677865743637085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,balanced,0.2618880073229472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,balanced,0.26263999938964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,balanced,39.812171936035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,balanced,0.26659200588862103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,balanced,0.2691253423690796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,balanced,0.08433600266774495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,balanced,0.2720373272895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,balanced,0.14028799533843994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,balanced,0.27462400992711383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,balanced,0.24996799230575562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,balanced,0.2754826744397481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,balanced,0.25517332553863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,balanced,0.2803200085957845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,balanced,0.2566453417142232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,balanced,0.28430400292078656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,balanced,0.26226667563120526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,balanced,0.26544533173243207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,balanced,0.2874880035718282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,balanced,0.267797331015269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,balanced,0.30373332897822064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,balanced,0.3120479981104533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,balanced,0.31722132364908856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,balanced,0.32807467381159466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,balanced,0.2720160086949666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,balanced,0.3909279902776082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,balanced,0.2755519946416219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,balanced,0.39984532197316486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,balanced,0.5232799847920736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,balanced,0.6266026496887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,balanced,0.8873226642608643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,balanced,0.28648000955581665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,balanced,1.143514633178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,balanced,0.2934719920158386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,balanced,1.6637867291768391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,balanced,0.29874666531880695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,balanced,0.3081013361612956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,balanced,0.33229867617289227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,balanced,2.3002613385518393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,balanced,0.34273068110148114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.1379583954811096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,balanced,0.3628693421681722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,balanced,0.49980799357096356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.21962239742279052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,balanced,3.4086828231811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,balanced,0.5464373429616293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.2642816066741943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,balanced,0.8115893205006918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.4685567855834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,balanced,1.083562692006429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,balanced,4.50924809773763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.4804992198944092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,balanced,1.6308213869730632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.49297919273376467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.0889024019241333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,balanced,2.171669324239095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.5178048133850097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.1343999981880188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,balanced,3.2540372212727866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.5005248069763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,balanced,5.569253285725911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.14620159864425658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.5096447944641114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.26213119029998777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,balanced,4.325285275777181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.5326975822448731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.01,0.25681281089782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.5322751998901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,power_law_1.01,0.08366720080375671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.26940159797668456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.5481344223022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,balanced,6.484773635864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,balanced,8.704282760620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.01,0.2743936061859131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.582860803604126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,power_law_1.01,0.11720960140228272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.01,0.2778879880905151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.587769603729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.13943040370941162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,power_law_1.01,0.14612480401992797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,balanced,8.690666834513346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.01,0.28044159412384034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.6353024005889892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.01,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.17509759664535524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,power_law_1.01,0.24813439846038818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.6302464008331299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.01,0.2867072105407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.2630336046218872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,power_law_1.01,0.25610239505767823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.6713664054870605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,balanced,11.024800618489584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.01,0.2969856023788452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.44525442123413084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,power_law_1.01,0.269267201423645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.7486783981323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.01,0.2966975927352905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.46851201057434083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,power_law_1.01,0.29244160652160645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.8409088134765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,balanced,17.827157338460285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.01,0.33580799102783204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.49411840438842775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,power_law_1.01,0.30713601112365724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.01,1.0269248008728027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.08910080194473266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.01,0.3586816072463989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.506982421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.11244159936904907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.01,0.3752000093460083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,balanced,18.508416493733723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.01,1.2974016189575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.5011328220367431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.1461951971054077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,power_law_1.01,0.2857215881347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.01,0.3784895896911621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.2548608064651489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.5167295932769775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.01,1.8631807327270509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,power_law_1.01,0.30587520599365237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.2558271884918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.01,0.4475071907043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,1,power_law_1.2,0.2713151931762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.5240767955780029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,0.4872960090637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,1,power_law_1.2,0.2787775993347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.01,2.276416015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.5367743968963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,1,power_law_1.2,0.2802432060241699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,0.613644790649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,1,power_law_1.2,0.2797696113586426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,power_law_1.01,0.3056256055831909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.5576064109802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.01,3.317900848388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,0.7551231861114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,1,power_law_1.2,0.2825216054916382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.5760064125061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,power_law_1.01,0.32222719192504884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,1,power_law_1.2,0.28286080360412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.01,4.297151947021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,1.023852825164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,1,power_law_1.2,0.30163838863372805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,power_law_1.01,0.33270399570465087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.5969535827636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,1,power_law_1.2,0.3004928112030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,1.2953920364379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.01,6.571186828613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,1,power_law_1.2,0.33971199989318845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.6224512100219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,power_law_1.01,0.35294079780578613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,1,power_law_1.2,0.3585216045379639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,balanced,41.19439951578776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,1.8127103805541993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.623744010925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,power_law_1.01,0.36145920753479005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,1,power_law_1.2,0.3634624004364014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.01,8.261721801757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.6757952213287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,2.360531234741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,power_law_1.01,0.37662079334259035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,1,power_law_1.2,0.37338240146636964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.752345609664917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,power_law_1.01,0.4303423881530762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,3.4715198516845702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,1,power_law_1.2,0.45107197761535645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.01,10.230790710449218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.8085824012756347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,power_law_1.01,0.5733248233795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,0.48679041862487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,4.595264053344726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,1,power_law_1.2,1.1113408088684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.01,0.7019968032836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,0.6267263889312744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.01,17.157656860351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,1,power_law_1.2,1.2812352180480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.01,5.661600112915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.01,0.9403136253356934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,0.746668815612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,1,power_law_1.2,0.08424959778785705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,1,power_law_1.2,1.828223991394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,1.0028223991394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.01,1.2089152336120605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.01,8.800755310058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,1,power_law_1.2,0.11262719631195069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,1,power_law_1.2,2.360576057434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,1.278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.01,1.7425792694091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,1,power_law_1.2,0.1422976016998291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.01,34.68970947265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,1,power_law_1.2,3.283430480957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,1.8323200225830079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.01,2.2892608642578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,1,power_law_1.2,0.24292480945587158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.01,17.90172119140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,1,power_law_1.2,4.305779266357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,2.3767936706542967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,1,power_law_1.2,0.2611583948135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.01,3.361894226074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,1,power_law_1.2,0.27501440048217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,3.501740646362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,1,power_law_1.2,6.636051177978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.01,4.433452987670899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,1,power_law_1.2,0.2817408084869385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,4.560793685913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,1,power_law_1.2,8.348089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,1,power_law_1.2,0.306278395652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.01,6.626732635498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,1,power_law_1.2,5.6219841003417965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,1,power_law_1.2,10.252230072021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.01,8.739148712158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,1,power_law_1.2,8.774092864990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,1,power_law_1.2,0.30247681140899657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,1,power_law_1.2,16.840269470214842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.01,10.99662094116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,1,power_law_1.2,0.31221120357513427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,1,power_law_1.2,17.903622436523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,power_law_1.01,18.496038818359374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,1,power_law_1.2,34.344357299804685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,1,power_law_1.2,0.30690560340881345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,1,power_law_1.2,0.3224384069442749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,1,power_law_1.2,0.34082560539245604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,power_law_1.01,40.06552429199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,1,power_law_1.2,0.3650880098342896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,1,power_law_1.2,0.3734911918640137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,1,power_law_1.2,0.38316800594329836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,1,power_law_1.2,0.45776000022888186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,1,power_law_1.2,0.577945613861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.2,0.6961855888366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.2,0.9786944389343262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.2,1.2210623741149902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.2,1.7931200027465821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.2,2.3390079498291017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.2,3.461119842529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.2,4.535801696777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.2,6.736204528808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.2,8.989427185058593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.2,11.16314239501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,1,power_law_1.2,18.05644836425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,balanced,0.22007467349370322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,1,power_law_1.2,38.64787292480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,balanced,0.41891733805338544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,balanced,0.8133973280588785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,balanced,0.8057173093159994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,balanced,0.8049493630727133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,balanced,0.8063413302103678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,balanced,0.8055786291758219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,balanced,0.8065706888834635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,balanced,0.8268266518910726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,balanced,0.8308107058207194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,balanced,0.8393226464589437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,balanced,0.13481066624323526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,balanced,0.8490239779154459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,balanced,0.8502079645792643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,balanced,0.2320800026257833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,balanced,0.8841386636098226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,balanced,0.9022239844004313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,balanced,0.42743468284606934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,balanced,0.9010186990102133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,balanced,0.4275199969609578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,balanced,0.9191093444824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,balanced,0.42817068099975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,balanced,1.0520906448364258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,balanced,0.43221867084503174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,balanced,1.063157320022583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,balanced,1.3604373931884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,balanced,0.4344746669133504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,balanced,0.43769601980845135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,balanced,1.7247519493103027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,balanced,0.43833601474761963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,balanced,2.458463986714681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,balanced,0.4426560004552205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,balanced,2.9515040715535483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,balanced,0.4584266742070516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,balanced,4.641632080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,balanced,0.45102934042612713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,balanced,0.45322132110595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,balanced,6.281226476033528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,balanced,0.4687093496322632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.01,0.34286720752716066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,balanced,0.48556268215179443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.01,0.42074241638183596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,balanced,0.4899253447850545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.01,0.5568895816802979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,balanced,10.411114374796549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,balanced,0.504746675491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.01,0.8067904472351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.01,0.7700736045837402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,balanced,0.6054346561431885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.01,0.8156671524047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,balanced,12.763130187988281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,balanced,0.6186879873275757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.1931712031364441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.01,0.8328895568847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,balanced,0.146506667137146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,balanced,0.8108906745910645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.01,0.8388352394104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,balanced,0.2241706649462382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.2552191972732544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,balanced,0.9602719942728678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.01,0.8626239776611329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,balanced,0.4118719895680745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.01,0.29456000328063964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,balanced,16.461135864257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,balanced,0.41741331418355304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.01,0.8774975776672364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,balanced,1.383562723795573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.01,0.42722558975219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,balanced,0.41886401176452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.01,0.9364864349365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,power_law_1.01,0.2251904010772705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,balanced,0.42483198642730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,balanced,1.772058645884196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.01,0.4264832019805908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.01,0.9730560302734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,balanced,0.42838935057322186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.01,0.4385536193847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,balanced,0.4310986598332723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.01,1.0241215705871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,balanced,2.6941121419270835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,power_law_1.01,0.24698240756988527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.01,0.4555647850036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,2,power_law_1.2,0.38040320873260497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.01,0.9425024032592774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.01,0.4506368160247803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,balanced,27.557993570963543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,2,power_law_1.2,0.5474239826202393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,balanced,3.3255573908487954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.01,1.0687359809875487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,power_law_1.01,0.24724481105804444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.01,0.4541440010070801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,2,power_law_1.2,0.5159872055053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,balanced,0.4358666737874349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.01,1.1311296463012694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,power_law_1.01,0.4179327964782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.01,0.46894078254699706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,balanced,0.4397493203481038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,2,power_law_1.2,0.8067263603210449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.01,1.167955207824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,balanced,5.124016125996907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,power_law_1.01,0.4210559844970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.01,0.4989312171936035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,2,power_law_1.2,0.8038975715637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.01,1.3474495887756348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,power_law_1.01,0.464415979385376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.01,0.5569727897644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,2,power_law_1.2,0.8226367950439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.01,1.743788719177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,power_law_1.01,0.5339903831481934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.01,0.5718912124633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,balanced,7.436496098836263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,2,power_law_1.2,0.8418815612792969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.01,2.2998079299926757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,power_law_1.01,0.5695744037628174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.01,0.5798143863677978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,2,power_law_1.2,0.8283647537231446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.01,2.8545343399047853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.01,0.7145215988159179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,2,power_law_1.2,0.8632063865661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,balanced,0.44867201646169025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.01,0.7084479808807373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,2,power_law_1.2,0.8788224220275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,balanced,0.4548373222351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.01,4.748608016967774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,balanced,9.479007720947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,power_law_1.01,0.5423679828643799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,balanced,54.9931894938151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,balanced,0.46247466405232746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.01,0.6419648170471192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,2,power_law_1.2,0.9429439544677735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.01,4.527795028686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,power_law_1.01,0.5415103912353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,balanced,0.470634659131368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.01,0.7886144161224365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,2,power_law_1.2,0.9550335884094239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.01,7.73966064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,0.9607680320739747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,2,power_law_1.2,1.1040767669677733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,power_law_1.01,0.48925437927246096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,1.24268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,2,power_law_1.2,0.9374784469604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,balanced,15.323744455973307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.01,14.068185424804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,balanced,0.49375466505686444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,power_law_1.01,0.5557375907897949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,1.4282560348510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,2,power_law_1.2,1.0919743537902833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,balanced,0.5056586662928263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,2.2397247314453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,2,power_law_1.2,1.1291007995605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,balanced,0.5296106735865275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,power_law_1.01,0.5767871856689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.01,19.645465087890624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,2.9673471450805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,balanced,0.7488053639729818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,2,power_law_1.2,1.1565312385559081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,power_law_1.01,0.6356736183166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,balanced,0.8001759847005209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,4.292601776123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,2,power_law_1.2,1.4079039573669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.01,21.65617980957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,2,power_law_1.2,1.6298368453979493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,5.982886505126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,2,power_law_1.2,2.0042560577392576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,power_law_1.01,0.5873600006103515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.22931840419769287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,8.428614044189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,2,power_law_1.2,3.1369279861450194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.01,28.17586669921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,balanced,1.1973973115285237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.27888638973236085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,power_law_1.01,0.7127999782562255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,balanced,30.577679951985676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,2,power_law_1.2,4.492716979980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,11.660575866699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,2,power_law_1.2,0.2817728042602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,balanced,1.5769333839416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,power_law_1.01,0.8546303749084473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,2,power_law_1.2,0.43756799697875975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,2,power_law_1.2,5.870054244995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,balanced,2.3866559664408364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.01,43.889260864257814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,2,power_law_1.2,0.438259220123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.01,17.58074951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,power_law_1.01,0.996889591217041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,2,power_law_1.2,9.030611419677735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,balanced,3.167071978251139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,2,power_law_1.2,0.44704642295837405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.01,1.296121597290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,2,power_law_1.2,0.4656832218170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,balanced,4.7806345621744795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,2,power_law_1.2,13.880601501464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.01,26.148959350585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,2,power_law_1.2,0.45885438919067384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.01,1.9199359893798829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,2,power_law_1.2,0.46849918365478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,balanced,6.484474817911784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,2,power_law_1.2,18.915481567382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.01,2.172665596008301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,2,power_law_1.2,0.4746240139007568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.01,3.1584768295288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,2,power_law_1.2,0.4891200065612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.01,49.110015869140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.01,105.06173095703124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,balanced,9.969600041707357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,2,power_law_1.2,24.362655639648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.01,4.985343933105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,2,power_law_1.2,0.5083903789520263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,2,power_law_1.2,0.5583360195159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.01,6.469439697265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,2,power_law_1.2,0.6318463802337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,2,power_law_1.2,27.45081481933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,balanced,13.861573537190756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,2,power_law_1.2,0.6647679805755615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.01,10.3853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,2,power_law_1.2,0.7521471977233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,2,power_law_1.2,0.6965184211730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,2,power_law_1.2,40.96058959960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,balanced,18.44858678181966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.01,14.041285705566406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,2,power_law_1.2,0.786572790145874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,1.0423232078552247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,1.202950382232666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.01,23.802035522460937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,1.5819392204284668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,2.590246391296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,balanced,32.641563415527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,2.6565248489379885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,power_law_1.01,35.22505493164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,2,power_law_1.2,107.2416748046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,5.735289764404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,6.302777481079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,8.128543853759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,power_law_1.01,62.74547119140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,13.193093872070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,2,power_law_1.2,17.388812255859374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,balanced,75.19704691569011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,2,power_law_1.2,23.573753356933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,power_law_1.01,113.89019775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,2,power_law_1.2,45.94355773925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,2,power_law_1.2,0.18914560079574586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,2,power_law_1.2,0.24615039825439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,2,power_law_1.2,0.24771199226379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,2,power_law_1.2,0.3675839900970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,2,power_law_1.2,0.4210559844970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,2,power_law_1.2,0.4682112216949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,2,power_law_1.2,0.5268479824066162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,2,power_law_1.2,0.5568384170532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,2,power_law_1.2,0.5588479995727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,2,power_law_1.2,0.5547967910766601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,balanced,0.23905066649119058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,2,power_law_1.2,0.49855360984802244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,2,power_law_1.2,0.5319039821624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,balanced,0.4181973139444987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,2,power_law_1.2,0.5459072113037109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,2,power_law_1.2,0.663270378112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,balanced,0.7904213269551595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,2,power_law_1.2,0.6420991897583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,balanced,0.7953653335571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,2,power_law_1.2,0.6790783882141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,balanced,0.7962720394134521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,2,power_law_1.2,0.8190143585205079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,balanced,0.14241066575050354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,2,power_law_1.2,1.053433609008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,balanced,0.8004906972249349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.2,1.4341376304626465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,balanced,0.22736533482869467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,balanced,0.8012373447418213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,balanced,0.4190239906311035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,balanced,0.8046560287475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.2,1.9714111328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,balanced,0.42535467942555744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,balanced,0.8258506457010905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.2,3.0921663284301757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,balanced,0.4238506555557251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,balanced,0.82969069480896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,balanced,0.8471360206604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,balanced,0.4278666575749715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.2,4.2545215606689455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,balanced,0.43379731973012287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,balanced,0.8431680202484131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.2,5.012179183959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,balanced,0.845029354095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,balanced,0.4355893135070801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,balanced,0.1439893345038096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,balanced,0.8878826300303141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.2,7.401849365234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,balanced,0.4378559986750285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,balanced,0.22172266244888306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,balanced,0.9064959685007731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,balanced,0.44040000438690186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,balanced,0.40959465503692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.2,11.540576171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,balanced,0.9053973356882731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,balanced,0.4490346511205037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,balanced,0.4142986536026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,balanced,0.9339146614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,balanced,0.45422399044036865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,balanced,0.4171946843465169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,balanced,1.0094239711761475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.2,16.150656127929686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,balanced,0.4571146567662557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,balanced,0.422757347424825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,balanced,1.0332053502400715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,balanced,0.42850665251413983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,balanced,0.47655999660491943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,balanced,1.3238506317138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,balanced,0.43115198612213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.24151039123535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.2,23.380184936523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,balanced,0.48661335309346515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,balanced,1.6570080121358235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.347871994972229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,balanced,0.4888693491617839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,balanced,2.4475839932759604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.36017279624938964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,balanced,0.51473601659139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,2,power_law_1.2,32.082516479492185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,balanced,3.0318241119384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.7450560092926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,balanced,0.4376000165939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,balanced,0.6126240094502767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.7624703884124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,balanced,4.6582291920979815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,balanced,0.44350401560465497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,balanced,0.6200853188832601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.7905600070953369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,balanced,0.8200266361236572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.8204095840454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,balanced,6.681882858276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.8296704292297363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,balanced,0.9945173263549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,2,power_law_1.2,61.925469970703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.8404864311218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,balanced,1.4068214098612468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.01,0.8894271850585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,balanced,10.356229146321615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.01,0.8832192420959473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,balanced,1.8073439598083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.01,0.9470911979675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,balanced,0.4549226760864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,balanced,2.615935961405436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.01,0.9546815872192382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,balanced,0.4642133315404256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.14796160459518432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,balanced,13.404954274495443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.01,0.9158783912658691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,balanced,0.47169065475463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,balanced,3.7218828201293945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.01,0.9705023765563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.1813055992126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,balanced,0.4834880034128825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.01,1.0195391654968262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.21887359619140626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,balanced,0.5107306639353434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.2437824010848999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.01,1.0600000381469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.01,0.41239042282104493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,balanced,5.548170725504558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,balanced,16.89669926961263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,balanced,0.5239786704381307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.2873408079147339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,2,power_law_1.2,144.24364013671874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.01,1.2698495864868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.01,0.40415358543395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,balanced,0.5542986790339152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,power_law_1.01,0.13861119747161865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.44892158508300783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.01,1.409926414489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.01,0.43260798454284666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,balanced,0.7871786753336588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.7778751850128174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,power_law_1.01,0.14888960123062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.01,1.8383359909057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,balanced,8.014229456583658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.01,0.450438404083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.7791168212890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,balanced,0.8558133443196615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,power_law_1.01,0.2262655973434448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.01,2.1743423461914064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.01,0.45264639854431155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.8083583831787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,power_law_1.01,0.4244863986968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,balanced,1.2756053606669109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.01,2.99865608215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,power_law_1.01,0.4174079895019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.01,0.4554175853729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.8279168128967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,balanced,27.712682088216145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,balanced,1.6947466532389324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,balanced,9.916943868001303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.8221887588500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,power_law_1.01,0.44204158782958985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.01,0.470246410369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.01,3.9596416473388674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,balanced,2.558666706085205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.8424384117126464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,power_law_1.01,0.4718592166900635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.01,0.4675583839416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.01,5.785452651977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,1,power_law_1.2,0.8984448432922363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,power_law_1.01,0.5019264221191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,balanced,3.415098508199056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.01,0.4932864189147949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.01,7.612409973144532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,1,power_law_1.2,0.8949119567871093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.01,0.504095983505249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,balanced,5.138325373331706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,1,power_law_1.2,0.9292223930358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.01,0.5110784053802491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,power_law_1.01,0.4852543830871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.01,11.833760070800782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,balanced,16.242005666097004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,1,power_law_1.2,1.0012031555175782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.01,0.5269248008728027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,power_law_1.01,0.5324992179870606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,1,power_law_1.2,0.9273344039916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,balanced,6.919354756673177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.01,0.5621056079864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.01,13.577299499511719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,1,power_law_1.2,1.0029824256896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.01,0.5806079864501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,1,power_law_1.2,1.025715160369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.01,0.6923711776733399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,1,power_law_1.2,1.0607104301452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,power_law_1.01,0.4854144096374512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.01,17.010041809082033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,balanced,10.741130828857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,balanced,55.173868815104164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,1,power_law_1.2,1.2656512260437012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,0.7540031909942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,power_law_1.01,0.4959871768951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,1,power_law_1.2,1.406879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,1.0150848388671876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,power_law_1.01,0.5266816139221191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,1.2045632362365724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,1,power_law_1.2,1.7641088485717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.01,28.300576782226564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,power_law_1.01,0.5767168045043946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,1.6871807098388671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,balanced,14.849562327067057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,1,power_law_1.2,2.1950847625732424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,power_law_1.01,0.5765183925628662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,2.14400634765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,balanced,30.01995086669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,1,power_law_1.2,2.98353271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,power_law_1.01,0.6070400238037109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,3.0424575805664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,power_law_1.01,0.7120192050933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,1,power_law_1.2,3.8878273010253905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,3.8731903076171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,power_law_1.01,0.9114496231079101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.01,55.716802978515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,1,power_law_1.2,5.995897674560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,balanced,19.363819122314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.01,1.1409472465515136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,5.747155380249024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,1,power_law_1.2,7.651936340332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.01,1.5316864013671876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,8.138739013671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,1,power_law_1.2,11.682418823242188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.01,1.9636159896850587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.01,10.085088348388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,1,power_law_1.2,13.576626586914063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.01,2.851033592224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,balanced,34.142822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.01,3.682521438598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.01,15.766035461425782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,1,power_law_1.2,16.807693481445312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.01,5.414438247680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.01,7.1853187561035154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,1,power_law_1.2,28.021087646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.01,28.571450805664064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.01,10.716416168212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.01,14.422720336914063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,1,power_law_1.2,54.96534423828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.01,18.71448974609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,balanced,75.32865397135417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,power_law_1.01,31.797918701171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,power_law_1.01,72.01856079101563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.13123199939727784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.1728127956390381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.21763200759887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,1,power_law_1.2,0.4030464172363281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,1,power_law_1.2,0.41466240882873534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,1,power_law_1.2,0.43396477699279784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,1,power_law_1.2,0.44941439628601076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,1,power_law_1.2,0.44434561729431155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,1,power_law_1.2,0.45649280548095705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,1,power_law_1.2,0.46535677909851075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,1,power_law_1.2,0.46072959899902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,1,power_law_1.2,0.48207998275756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,1,power_law_1.2,0.5022784233093261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,1,power_law_1.2,0.5061183929443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,1,power_law_1.2,0.5325568199157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,1,power_law_1.2,0.5422016143798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,1,power_law_1.2,0.574892807006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,1,power_law_1.2,0.7035711765289306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,0.7757440090179444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,1.02357759475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,1.2195520401000977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,1.6362815856933595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,2.0559551239013674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,3.077427291870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,1,power_law_1.2,0.13959039449691774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,1,power_law_1.2,0.1755136013031006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,3.891244888305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,1,power_law_1.2,0.20283520221710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,1,power_law_1.2,0.3940927982330322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,5.739251327514649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,1,power_law_1.2,0.41617918014526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,1,power_law_1.2,0.45342721939086916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,8.158477020263671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,1,power_law_1.2,0.48372478485107423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,1,power_law_1.2,0.521888017654419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,1,power_law_1.2,9.971161651611329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,1,power_law_1.2,0.49320321083068847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,1,power_law_1.2,15.869888305664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,1,power_law_1.2,0.4961408138275146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,1,power_law_1.2,29.662823486328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,1,power_law_1.2,0.48458237648010255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,1,power_law_1.2,0.509715223312378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,1,power_law_1.2,0.528927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,1,power_law_1.2,0.582476806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,1,power_law_1.2,0.5497600078582764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,1,power_law_1.2,0.608844804763794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,1,power_law_1.2,0.6944896221160889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,balanced,0.11028800408045451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,1,power_law_1.2,0.8905216217041015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,balanced,0.1755946675936381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.2,1.0827648162841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,balanced,0.15685866276423135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,balanced,0.2648373246192932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.2,1.498265552520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.2,1.897145652770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,balanced,0.4843839804331462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,balanced,0.2704586585362752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.2,2.7408832550048827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,balanced,0.9386879603068033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,balanced,0.5008639891942342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.2,3.5841854095458983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,balanced,0.96014936765035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,balanced,1.844373385111491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.2,5.291187286376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,balanced,1.8777920405069988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,balanced,3.6581598917643228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.2,6.99939193725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,balanced,1.8767253557840984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,balanced,3.6653547286987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.2,10.62512664794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,balanced,1.8787466684977214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,balanced,3.6589492162068686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,balanced,1.8893067042032878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.2,14.5478271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,balanced,3.679861386617025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,balanced,1.8898560206095378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,balanced,3.6829067866007485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.2,18.686015319824218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,balanced,1.8963039716084797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,balanced,3.6942612330118814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,balanced,1.9099520047505696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.01,0.2928319931030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,balanced,3.7120958964029946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,1,power_law_1.2,32.08651428222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,balanced,1.91484800974528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.01,0.4892223834991455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,balanced,3.7216053009033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,balanced,1.9425493876139324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.01,0.44396162033081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,balanced,3.6856053670247397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,balanced,1.9570026397705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.01,0.7363135814666748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,balanced,1.9679199854532878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.01,1.1869248390197753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,balanced,3.7162399291992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.01,1.7562688827514648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,balanced,2.0147199630737305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,balanced,3.7215305964152017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,1,power_law_1.2,72.27020874023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.01,2.571615982055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.17555199861526488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,balanced,0.12685867150624594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,balanced,2.0625173250834146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,balanced,3.8569065729777017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.01,2.698137664794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.01,0.2693183898925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,balanced,0.17007466157277426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.01,2.787180709838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,balanced,3.9023733139038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,balanced,2.109781265258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,balanced,0.32068800926208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.01,0.2714495897293091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,balanced,0.5165493488311768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.01,2.830860710144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.01,0.38815999031066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,balanced,3.9895785649617515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,balanced,2.1632960637410483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.01,0.615718412399292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.01,2.9475711822509765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,balanced,0.9491199652353922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,balanced,4.080933252970378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.01,0.9020544052124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.01,2.961414337158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,balanced,1.8340694109598796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,balanced,2.31002140045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.01,1.2222335815429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.01,3.1485504150390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,balanced,1.8450826009114583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,balanced,4.293530782063802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.01,1.388371181488037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,balanced,1.8511999448140461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.01,3.167571258544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,balanced,2.4474132855733237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,power_law_1.01,0.20421760082244872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.01,1.4223936080932618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.01,3.2126846313476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,balanced,1.8583359718322754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,balanced,4.438960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.01,1.4815872192382813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,power_law_1.01,0.30517120361328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.01,3.320460891723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,balanced,1.8672266006469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,power_law_1.01,0.2349247932434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.01,1.590771198272705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.01,3.6864704132080077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,balanced,2.619215965270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,balanced,1.8839893341064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,power_law_1.01,0.3908544063568115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,balanced,4.663781483968099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.01,4.152812957763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.01,1.683577537536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,balanced,1.9007679621378581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.01,4.260332870483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,power_law_1.01,0.6949056148529053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.01,1.6365951538085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.01,4.831782531738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,power_law_1.01,0.929088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,balanced,1.913248062133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.01,1.7350208282470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.01,4.321120071411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,balanced,3.211455980936686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,power_law_1.01,1.2910271644592286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,balanced,5.109104156494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,balanced,1.9378239313761394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.01,1.7212863922119142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.01,4.918495941162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,power_law_1.01,1.4500351905822755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,balanced,1.9644959767659504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.01,1.8012287139892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.01,5.574444961547852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,power_law_1.01,1.4875904083251954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,balanced,1.9892266591389973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.01,2.0633663177490233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,power_law_1.01,1.5291071891784669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.01,6.487296295166016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,balanced,3.4966932932535806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.01,2.2234495162963865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,balanced,2.0490293502807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,balanced,5.520240147908528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,power_law_1.01,1.6062271118164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.01,7.752793884277343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,2.166444778442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,power_law_1.01,1.6685888290405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.01,10.658834838867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,2.534931182861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,power_law_1.01,1.739084815979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,2.35351676940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,power_law_1.01,1.8676544189453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.01,14.741542053222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,balanced,2.1590347290039062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,power_law_1.01,2.056934356689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,2.661843109130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,balanced,4.39845339457194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,balanced,7.093503952026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,power_law_1.01,2.170694351196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,2.9188671112060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.01,16.538003540039064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,power_law_1.01,2.4012800216674806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,3.6109695434570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.01,27.239443969726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,4.495750427246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,power_law_1.01,2.4562047958374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,6.220012664794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,balanced,2.2836052576700845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,7.8689216613769535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,balanced,5.919818878173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.01,45.473095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.01,2.4178239822387697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,balanced,9.21569569905599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.01,9.543289947509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,balanced,2.478208065032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.01,2.929190444946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,balanced,2.6525012652079263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.01,12.464403533935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.01,3.3409984588623045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.01,3.653472137451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,balanced,3.054848035176595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.01,4.435456085205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.01,24.79842529296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.01,5.7518657684326175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,balanced,7.001834869384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,balanced,3.3997227350870767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.01,7.203993225097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,balanced,11.880666097005209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.01,10.37741470336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,balanced,5.191946665445964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.01,13.745420837402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,power_law_1.01,16.222720336914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,balanced,6.061007817586263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.01,27.75941162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,2,power_law_1.2,0.28986239433288574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,2,power_law_1.2,0.490118408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,2,power_law_1.2,0.3324160099029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,balanced,10.954762776692709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,2,power_law_1.2,0.6196479797363281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,power_law_1.01,58.75968017578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,2,power_law_1.2,1.0594367980957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,balanced,9.061349232991537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,balanced,24.53399403889974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,2,power_law_1.2,1.4778688430786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,2,power_law_1.2,2.4303871154785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,2,power_law_1.2,2.617612838745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,2,power_law_1.2,2.6890560150146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,2,power_law_1.2,2.9217599868774413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,balanced,12.767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,2,power_law_1.2,2.9993663787841798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,2,power_law_1.2,3.1136512756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,2,power_law_1.2,3.2434497833251954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,2,power_law_1.2,3.1465280532836912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,2,power_law_1.2,3.327769470214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,2,power_law_1.2,3.4292415618896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.17594879865646362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,2,power_law_1.2,3.861075210571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,2,power_law_1.2,0.25763840675354005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,2,power_law_1.2,4.2153984069824215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,2,power_law_1.2,0.19468799829483033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,balanced,15.849093119303385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,2,power_law_1.2,4.546527862548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,2,power_law_1.2,0.3732032060623169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,2,power_law_1.2,0.5859776020050049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,2,power_law_1.2,5.195455932617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,2,power_law_1.2,0.7888959884643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,2,power_law_1.2,4.555033493041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,2,power_law_1.2,1.2309632301330566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,2,power_law_1.2,5.286054229736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,2,power_law_1.2,1.3453503608703614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,2,power_law_1.2,6.010092926025391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,2,power_law_1.2,1.3517631530761718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,balanced,22.144564310709637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,2,power_law_1.2,1.5025152206420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,2,power_law_1.2,7.527897644042969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,2,power_law_1.2,1.5714624404907227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,2,power_law_1.2,8.942009735107423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,2,power_law_1.2,1.6221632003784179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,balanced,39.3825429280599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,2,power_law_1.2,1.7170944213867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,2,power_law_1.2,11.95265884399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,2,power_law_1.2,1.7526527404785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,2,power_law_1.2,1.8701055526733399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,2,power_law_1.2,1.918022346496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,2,power_law_1.2,15.537799072265624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,2,power_law_1.2,2.0570240020751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,2,power_law_1.2,2.3601472854614256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,balanced,27.29186248779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,2,power_law_1.2,19.862745666503905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,2.359916877746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,2.6924095153808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,2.389606475830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,2,power_law_1.2,25.903781127929687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,2.834067153930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,3.335744094848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,3.955148696899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,4.673958587646484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,2,power_law_1.2,48.86982421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,6.713043212890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,7.947698974609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,2,power_law_1.2,9.866099548339843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,2,power_law_1.2,12.635155487060548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,2,power_law_1.2,25.610833740234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,2,power_law_1.2,0.1901952028274536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,2,power_law_1.2,0.2843071937561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,2,power_law_1.2,0.21509759426116942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,2,power_law_1.2,0.3799040079116821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,balanced,0.1774079998334249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,2,power_law_1.2,0.5727807998657226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,2,power_law_1.2,0.794271993637085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,balanced,0.26580266157786053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,balanced,54.581380208333336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,2,power_law_1.2,1.3046208381652833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,balanced,0.49113066991170246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,2,power_law_1.2,1.3533696174621581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,2,power_law_1.2,1.3923775672912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,balanced,0.9556960264841715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,2,power_law_1.2,1.48156795501709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,2,power_law_1.2,1.5606016159057616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,balanced,1.8505333264668782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,2,power_law_1.2,1.6555648803710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,balanced,3.6526880264282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,2,power_law_1.2,1.763545608520508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,2,power_law_1.2,1.8625984191894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,balanced,3.6579198837280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,2,power_law_1.2,2.0442304611206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,balanced,3.6728693644205728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,2,power_law_1.2,2.2123392105102537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,balanced,3.6736319859822593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,2,power_law_1.2,2.418841552734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,balanced,3.6801973978678384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,balanced,0.11173866192499797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,balanced,3.70142396291097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,2,power_law_1.2,2.58154239654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,balanced,0.16144532958666483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,balanced,3.7081705729166665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,balanced,0.27987200021743774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,balanced,3.717461268107096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.2,2.4791744232177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,balanced,0.5213599999745687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,balanced,3.7477814356486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.2,2.8593984603881837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,balanced,0.9943946997324625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,balanced,3.7519200642903647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.2,3.460492706298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,balanced,1.9535306294759114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,balanced,1.9827146530151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.2,3.72806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,balanced,3.779658635457357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,balanced,1.9702986081441243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.2,4.412691116333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,balanced,3.836832046508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,balanced,1.9845493634541829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.2,6.179340744018555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,balanced,4.008965492248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,balanced,2.0044800440470376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,balanced,1.9956906636555989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.2,8.323814392089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,balanced,4.1582291920979815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,balanced,2.0106239318847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.2,10.77925796508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,balanced,4.30787722269694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,balanced,2.0368107159932456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,balanced,2.0658772786458335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.2,15.539642333984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,balanced,4.527957280476888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,balanced,2.08679993947347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,2,power_law_1.2,18.701997375488283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,balanced,2.0960213343302407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,balanced,4.819781303405762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,balanced,2.134138743082682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,balanced,2.214458624521891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.2,29.713894653320313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,balanced,5.080160140991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,balanced,2.2551306088765464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,balanced,2.355050722757975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,balanced,6.15232531229655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,balanced,2.541312058766683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,2,power_law_1.2,56.86739501953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,balanced,2.792949358622233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,balanced,0.15844800074895224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,balanced,6.961141586303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,balanced,0.19850132862726846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,balanced,3.0604426066080728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.17449599504470825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,balanced,0.3425706624984741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,balanced,0.5390239953994751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.2649152040481567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,balanced,0.973365306854248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.3296639919281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,balanced,1.863690694173177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,balanced,3.672954559326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,balanced,1.879866600036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.7168831825256348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,balanced,8.760079701741537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,balanced,1.8951999346415203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,balanced,1.9052693049112956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.01,1.1524479866027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,balanced,1.915770689646403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.01,1.5956607818603517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,balanced,1.9370080629984539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,balanced,4.350319862365723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.01,2.440390396118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,balanced,1.9672640164693196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,balanced,1.9830293655395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.01,2.6775232315063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,balanced,2.0293919245402017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.01,2.6846080780029298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,balanced,2.080730597178141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,balanced,10.815914154052734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.01,2.8706687927246093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,balanced,2.1201119422912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.01,2.9036544799804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,balanced,5.781791687011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,balanced,2.2007412910461426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.11087360382080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.01,2.970137596130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.01,3.0827392578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.15808639526367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.01,0.17559679746627807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.01,3.1897727966308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.01,0.39127678871154786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.01,3.2028865814208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,balanced,2.370944023132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.01,0.6291967868804932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.01,3.374496078491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.01,0.8950143814086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,balanced,7.4821014404296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,balanced,12.707115173339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.01,3.601919937133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.01,1.2875904083251952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.01,1.3714752197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.01,3.8712703704833986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.01,1.4315839767456056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,power_law_1.01,0.156550395488739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.01,4.383391952514648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.01,1.4917695999145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,power_law_1.01,0.21438078880310057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.01,1.4958847999572753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.01,5.019027328491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,balanced,2.561072031656901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,power_law_1.01,0.22033278942108153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.01,1.6065471649169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.01,4.563859176635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,power_law_1.01,0.4099008083343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.01,1.6262336730957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,power_law_1.01,0.6227456092834472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.01,5.141209411621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.01,1.706937599182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,balanced,2.899807929992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,power_law_1.01,0.876467227935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.01,1.813497543334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.01,5.718124771118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,power_law_1.01,1.268064022064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,balanced,8.991856257120768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.01,1.8704767227172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,balanced,3.197744051615397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,power_law_1.01,1.374291229248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.01,6.868946838378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.01,1.9988672256469726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,power_law_1.01,1.442124843597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.01,2.2244543075561523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,power_law_1.01,1.4791616439819335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.01,8.194226837158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,balanced,3.9332907994588218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,power_law_1.01,1.5853055953979491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,2.260684776306152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.01,11.03623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,power_law_1.01,1.6857023239135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,balanced,20.602986653645832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,2.5182592391967775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,power_law_1.01,1.7762432098388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,2.3804351806640627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,balanced,4.538448015848796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.01,14.710054016113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.17441920042037964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,power_law_1.01,1.904204750061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,2.702444839477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,power_law_1.01,2.0901119232177736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.2540544033050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,3.0793216705322264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,power_law_1.01,2.2121599197387694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.01,17.81562194824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.33758718967437745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,3.9368385314941405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,power_law_1.01,2.468953514099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,balanced,7.237781524658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.6047359943389893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,4.782969665527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,1,power_law_1.2,1.0142271995544434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.01,24.438374328613282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,1,power_law_1.2,1.4792960166931153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,6.586528015136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,power_law_1.01,2.5635520935058596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,balanced,15.31760025024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,1,power_law_1.2,2.4089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,8.476780700683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,balanced,8.736143747965494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,1,power_law_1.2,2.567475128173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.01,2.579167938232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.01,41.335488891601564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,1,power_law_1.2,2.7213695526123045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.01,10.350003051757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.01,3.1314367294311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,1,power_law_1.2,2.631315231323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.01,3.6528385162353514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.01,17.044160461425783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.01,4.356159973144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,1,power_law_1.2,2.907142448425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.01,5.280710220336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,1,power_law_1.2,3.0315135955810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.01,7.1730499267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,balanced,12.479700724283854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,1,power_law_1.2,3.0796672821044924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.01,31.746368408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.01,9.237926483154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,1,power_law_1.2,3.291948699951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.01,13.379283142089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,1,power_law_1.2,3.3954303741455076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,1,power_law_1.2,3.498463821411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.01,17.40804443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,1,power_law_1.2,3.667641448974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.01,21.50232391357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,1,power_law_1.2,4.086739349365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,balanced,17.455460866292317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,1,power_law_1.2,4.701408004760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,balanced,43.899983723958336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,power_law_1.01,33.68748168945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,1,power_law_1.2,5.421612930297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,1,power_law_1.2,4.882137680053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,1,power_law_1.2,5.485548782348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,1,power_law_1.2,6.088864135742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,power_law_1.01,69.66751098632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,1,power_law_1.2,7.598105621337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,balanced,21.471242268880207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,balanced,31.68530782063802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,1,power_law_1.2,9.08251495361328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.11084159612655639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.15760639905929566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,1,power_law_1.2,12.2052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,1,power_law_1.2,0.18187520503997803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,1,power_law_1.2,0.36364800930023194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,1,power_law_1.2,15.514533996582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,1,power_law_1.2,0.5664383888244628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,1,power_law_1.2,0.7756351947784423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,1,power_law_1.2,18.567872619628908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,1,power_law_1.2,1.2506560325622558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,1,power_law_1.2,1.390118408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,1,power_law_1.2,1.3646464347839355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,1,power_law_1.2,23.640403747558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,1,power_law_1.2,1.457919979095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,1,power_law_1.2,1.52673282623291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,1,power_law_1.2,1.6254079818725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,1,power_law_1.2,1.7109376907348632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,1,power_law_1.2,40.903628540039065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,1,power_law_1.2,1.7254335403442382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,balanced,36.29330698649088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,1,power_law_1.2,1.8780607223510741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,1,power_law_1.2,1.9156608581542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,1,power_law_1.2,2.0716991424560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,1,power_law_1.2,2.3496959686279295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,2.3217920303344726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,2.6487808227539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,2.5546560287475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,2.932896041870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,3.3749183654785155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,4.203308868408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,5.102944183349609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,6.8969474792480465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,8.849318695068359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,1,power_law_1.2,10.646784210205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,1,power_law_1.2,17.206080627441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,1,power_law_1.2,31.132199096679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,balanced,73.05638631184895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,1,power_law_1.2,0.16613119840621948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,1,power_law_1.2,0.20563840866088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,balanced,0.032730666299661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,1,power_law_1.2,0.23174400329589845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,1,power_law_1.2,0.380947208404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,balanced,0.0492799977461497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,balanced,0.07441600163777669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,1,power_law_1.2,0.5910655975341796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,1,power_law_1.2,0.7718336105346679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,balanced,0.12441600362459819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,1,power_law_1.2,1.2834431648254394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,balanced,0.22132267554601034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,1,power_law_1.2,1.3314687728881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,balanced,0.2226346731185913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,1,power_law_1.2,1.3895551681518554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,balanced,0.22376533349355063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,1,power_law_1.2,1.4783552169799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,balanced,0.22518932819366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,1,power_law_1.2,1.6005695343017579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,balanced,0.226090669631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,1,power_law_1.2,1.6742015838623048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,1,power_law_1.2,1.771891212463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,balanced,0.22737600406010947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,1,power_law_1.2,1.9870719909667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,balanced,0.2278453310330709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,1,power_law_1.2,2.133932876586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,balanced,0.23055466016133627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,balanced,0.03699733316898346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,1,power_law_1.2,2.261081504821777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,balanced,0.23269865910212198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,balanced,0.036677333215872444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,1,power_law_1.2,2.502227210998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,balanced,0.23567465941111246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,balanced,0.05635733405749003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,balanced,0.08461866776148479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,balanced,0.24612800280253092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,balanced,0.1329813301563263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,balanced,0.24930665890375772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,balanced,0.13515200217564902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,1,power_law_1.2,2.6693824768066405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,balanced,0.25783999760945636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,balanced,0.13667200009028116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,balanced,0.13702399532000223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,balanced,0.2754559914271037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,balanced,0.13846400380134583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.2,2.684204864501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,balanced,0.2938026587168376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,power_law_1.01,0.04642559885978699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,balanced,0.13942933082580566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.2,3.2756542205810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,balanced,0.31546133756637573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,balanced,0.14155200123786926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,balanced,0.14403733611106873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.2,3.836134338378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,power_law_1.01,0.06112639904022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,balanced,0.34364267190297443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,balanced,0.1453493336836497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,power_law_1.01,0.09662719964981079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.2,4.497580718994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,balanced,0.1500746707121531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,power_law_1.01,0.11985280513763427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,balanced,0.4142666657765706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,balanced,0.04271999994913737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.2,5.456620788574218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,balanced,0.15502933661142984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,power_law_1.01,0.18855040073394774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,balanced,0.04432533184687296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,balanced,0.15987199544906616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.2,7.363820648193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,balanced,0.056032001972198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,balanced,0.4609920183817546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,power_law_1.01,0.20110719203948973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,balanced,0.16821332772572836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,balanced,0.0857919951279958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.2,9.300339508056641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,power_law_1.01,0.20245759487152098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,balanced,0.1352000037829081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,balanced,0.18332799275716147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,power_law_1.01,0.20993919372558595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,balanced,0.1351626714070638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,balanced,0.14108799894650778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,balanced,0.20188800493876138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.2,13.226194763183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,power_law_1.01,0.21836159229278565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,balanced,0.6242186625798544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,balanced,0.14134933551152548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,power_law_1.01,0.225382399559021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,balanced,0.23003733158111572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,balanced,0.1416373352209727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,power_law_1.01,0.22860798835754395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.2,17.407545471191405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,balanced,0.14485333363215128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,balanced,0.1483680009841919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,balanced,0.2542293270428975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,power_law_1.01,0.2255295991897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,balanced,0.7886880238850912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,balanced,0.15245866775512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,power_law_1.01,0.03937279880046844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,power_law_1.01,0.23326079845428466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.2,21.268141174316405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,balanced,0.1546026666959127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,balanced,0.3359573284784953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,power_law_1.01,0.2498624086380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,power_law_1.01,0.051481598615646364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,balanced,0.1618773341178894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,power_law_1.01,0.06651520133018493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,power_law_1.01,0.26134400367736815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,power_law_1.01,0.08057600259780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,balanced,0.39635733763376874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,1,power_law_1.2,34.627777099609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,power_law_1.01,0.2742784023284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,power_law_1.01,0.11649919748306274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,power_law_1.01,0.2981120109558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,balanced,1.1291999816894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,power_law_1.01,0.12360960245132446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,power_law_1.01,0.29852159023284913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,power_law_1.01,0.12908799648284913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,balanced,0.16909867525100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,power_law_1.01,0.3412928104400635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,balanced,0.5518826643625895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,power_law_1.01,0.1279360055923462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,balanced,0.17734932899475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,power_law_1.01,0.3795264005661011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,power_law_1.01,0.13178880214691163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,power_law_1.01,0.4632063865661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,power_law_1.01,0.13612159490585327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,1,power_law_1.2,68.54696044921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,power_law_1.01,0.5348288059234619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,power_law_1.01,0.1425279974937439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,power_law_1.01,0.7418623924255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,power_law_1.01,0.14665600061416625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,balanced,0.7153279781341553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,power_law_1.01,0.9388863563537597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,power_law_1.01,0.14743679761886597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,balanced,1.5074666341145833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,power_law_1.01,1.2576512336730956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,power_law_1.01,0.15603840351104736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,balanced,0.19543466965357462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,power_law_1.01,1.7324735641479492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,power_law_1.01,0.15887999534606934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,power_law_1.01,2.0552383422851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,balanced,0.22276800870895386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,power_law_1.01,0.17166719436645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,power_law_1.01,3.326630401611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,balanced,0.23796266317367554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,power_law_1.01,0.1953727960586548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,balanced,1.0434292952219646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,power_law_1.01,6.763072204589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,balanced,0.30643200874328613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,power_law_1.01,0.21537280082702637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,power_law_1.01,0.26010239124298096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,balanced,0.36346666018168133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,power_law_1.01,0.28395519256591795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,balanced,1.8570720354715984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,power_law_1.01,0.37253758907318113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,balanced,0.5347359975179037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,power_law_1.01,0.46489601135253905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,power_law_1.01,0.6661439895629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,power_law_1.01,0.04254719913005829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,balanced,1.3734505971272786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,power_law_1.01,0.8073535919189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,balanced,0.6401546796162924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,power_law_1.01,0.0449535995721817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,power_law_1.01,1.1332544326782226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,power_law_1.01,0.054054397344589236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,power_law_1.01,1.547276782989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,power_law_1.01,0.06854400038719177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,power_law_1.01,1.8478464126586913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,balanced,0.9374986489613851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,power_law_1.01,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,power_law_1.01,2.9104448318481446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,2,power_law_1.2,0.045817598700523376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,power_law_1.01,0.11796480417251587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,power_law_1.01,0.1242624044418335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,2,power_law_1.2,0.04083200097084046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,power_law_1.01,5.977964782714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,power_law_1.01,0.13137919902801515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,2,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,power_law_1.01,0.13464319705963135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,balanced,1.231007973353068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,2,power_law_1.2,0.08501759767532349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,power_law_1.01,0.13480960130691527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,balanced,1.702170689900716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,2,power_law_1.2,0.11679999828338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,power_law_1.01,0.1424831986427307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,power_law_1.01,0.15058560371398927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,2,power_law_1.2,0.18556159734725952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,balanced,2.9004907608032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,power_law_1.01,0.15597440004348756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,power_law_1.01,0.16885759830474853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,2,power_law_1.2,0.19487359523773193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,2,power_law_1.2,0.20984320640563964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,balanced,1.8088159561157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,power_law_1.01,0.17802879810333253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,2,power_law_1.2,0.21558399200439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,power_law_1.01,0.1816704034805298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,2,power_law_1.2,0.22422399520874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,2,power_law_1.2,0.23045759201049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,power_law_1.01,0.20113279819488525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,2,power_law_1.2,0.2311232089996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,power_law_1.01,0.23493759632110595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,2,power_law_1.2,0.23271679878234863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,power_law_1.01,0.2630784034729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,2,power_law_1.2,0.2444607973098755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,power_law_1.01,0.33832321166992185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,balanced,2.388319969177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,2,power_law_1.2,0.25292799472808836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,power_law_1.01,0.42838401794433595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,2,power_law_1.2,0.25564160346984866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,balanced,2.6753759384155273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,power_law_1.01,0.6099071979522706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,2,power_law_1.2,0.28244481086730955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,power_law_1.01,0.7444352149963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,2,power_law_1.2,0.31169919967651366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,power_law_1.01,1.067142391204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,2,power_law_1.2,0.3264575958251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,power_law_1.01,1.3327872276306152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,2,power_law_1.2,0.35792639255523684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,power_law_1.01,1.958745574951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,2,power_law_1.2,0.4054592132568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,2,power_law_1.2,0.473203182220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,power_law_1.01,2.718105506896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,2,power_law_1.2,0.580019187927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,power_law_1.01,3.5258113861083986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,2,power_law_1.2,0.7589824199676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,balanced,2.9685118993123374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,2,power_law_1.2,0.9198143959045411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,power_law_1.01,5.0863807678222654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,2,power_law_1.2,1.3718720436096192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,power_law_1.01,10.876140594482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,2,power_law_1.2,1.7373056411743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,2,power_law_1.2,2.289811134338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,balanced,5.682698567708333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,2,power_law_1.2,3.15097599029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,2,power_law_1.2,7.87852783203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,balanced,4.698426564534505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,balanced,5.140762646993001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,2,power_law_1.2,0.0381056010723114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,2,power_law_1.2,0.04020479917526245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,2,power_law_1.2,0.04862079918384552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,2,power_law_1.2,0.06496000289916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,2,power_law_1.2,0.07808640003204345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,2,power_law_1.2,0.11767040491104126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,2,power_law_1.2,0.12811520099639892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,balanced,9.31219228108724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,2,power_law_1.2,0.12674560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,2,power_law_1.2,0.13533439636230468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,2,power_law_1.2,0.137881600856781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,2,power_law_1.2,0.14216959476470947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,2,power_law_1.2,0.14468480348587037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,2,power_law_1.2,0.14999040365219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,2,power_law_1.2,0.04174720048904419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,2,power_law_1.2,0.14948480129241942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,2,power_law_1.2,0.1583295941352844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,2,power_law_1.2,0.04570240080356598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,balanced,0.03557866563399633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,2,power_law_1.2,0.16548479795455934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,2,power_law_1.2,0.052774399518966675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,balanced,0.04966933528582255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,2,power_law_1.2,0.17377279996871947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,2,power_law_1.2,0.06584960222244263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,balanced,0.07447466750939687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,2,power_law_1.2,0.20056960582733155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,balanced,0.12520000338554382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,2,power_law_1.2,0.0797760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,balanced,0.22173333168029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,2,power_law_1.2,0.2257920026779175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,2,power_law_1.2,0.12092800140380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,balanced,0.22485866149266562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,2,power_law_1.2,0.2640127897262573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,balanced,0.22559465964635214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,2,power_law_1.2,0.1254271984100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,2,power_law_1.2,0.30047359466552737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,balanced,0.2266026735305786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,2,power_law_1.2,0.13236479759216307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,balanced,0.22868265708287558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,2,power_law_1.2,0.39572479724884035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,2,power_law_1.2,0.13742079734802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,balanced,0.22764799992243448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,2,power_law_1.2,0.4805568218231201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,balanced,0.23153066635131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,2,power_law_1.2,0.1406399965286255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,2,power_law_1.2,0.6675007820129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,balanced,0.23463465770085654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,2,power_law_1.2,0.14764800071716308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,balanced,0.23772267500559488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,2,power_law_1.2,0.8051775932312012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,2,power_law_1.2,0.15545599460601806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,balanced,0.24143999814987183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,2,power_law_1.2,1.2937408447265626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,2,power_law_1.2,0.15857280492782594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,balanced,0.25123733282089233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,2,power_law_1.2,1.532908821105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,2,power_law_1.2,0.1725376009941101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,balanced,0.2539199988047282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,2,power_law_1.2,1.8968063354492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,balanced,0.267359991868337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,2,power_law_1.2,0.1783552050590515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,2,power_law_1.2,3.1546304702758787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,balanced,0.292303999265035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,2,power_law_1.2,0.19226880073547364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,balanced,0.3202613393465678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,2,power_law_1.2,6.746905517578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,balanced,0.3569440046946208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,2,power_law_1.2,0.19843839406967162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,2,power_law_1.2,0.23399679660797118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,balanced,0.3973653316497803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,2,power_law_1.2,0.2818432092666626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,balanced,0.5083786646525065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,2,power_law_1.2,0.3538111925125122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,2,power_law_1.2,0.4309247970581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,2,power_law_1.2,0.6257791996002198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,balanced,0.5949920018513998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,2,power_law_1.2,0.7486207962036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,2,power_law_1.2,1.1478591918945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,2,power_law_1.2,1.399123191833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,balanced,0.03802666564782461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,balanced,0.8376853466033936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,2,power_law_1.2,2.0981376647949217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,balanced,0.03852800031503042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,balanced,0.05810666580994924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,2,power_law_1.2,3.085772705078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,balanced,0.08633599678675334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,2,power_law_1.2,3.4812545776367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,balanced,0.13702399532000223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,balanced,1.0680480003356934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,balanced,0.1381653348604838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,2,power_law_1.2,5.798054504394531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,balanced,0.14139200250307718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,balanced,0.14127467075983682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,power_law_1.01,0.03314560055732727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,2,power_law_1.2,11.413030242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,balanced,0.0633546660343806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,balanced,0.1437173287073771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,power_law_1.01,0.041119998693466185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,balanced,0.06584533552328746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,balanced,0.1451520025730133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,power_law_1.01,0.060915201902389526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,balanced,1.5523573557535808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,balanced,0.07323733468850453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,balanced,0.14839999874432883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,power_law_1.01,0.08792319893836975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,balanced,0.09946133693059285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,balanced,0.1513759990533193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,power_law_1.01,0.11862399578094482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,balanced,0.14943466583887735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,balanced,0.15662399927775064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,power_law_1.01,0.18528000116348267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,balanced,0.15289066235224405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,balanced,0.15556800365447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,power_law_1.01,0.19578880071640015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,balanced,0.1613920032978058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,balanced,0.1586079994837443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,power_law_1.01,0.20785920619964598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,power_law_1.01,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,balanced,0.16995733976364136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,balanced,0.1618933379650116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,power_law_1.01,0.2089087963104248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,balanced,0.17676266034444174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,power_law_1.01,0.038387200236320494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,balanced,0.16602133711179098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,power_law_1.01,0.21537280082702637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,balanced,2.037738641103109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,balanced,0.1927573283513387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,power_law_1.01,0.051622402667999265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,balanced,0.17031466960906982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,power_law_1.01,0.22428159713745116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,power_law_1.01,0.06724479794502258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,balanced,0.21831466754277548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,balanced,0.17633599042892456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,power_law_1.01,0.2296447992324829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,power_law_1.01,0.08120959997177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,power_law_1.01,0.23922560214996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,balanced,0.18078400691350302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,balanced,0.24065599838892618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,power_law_1.01,0.11856640577316284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,power_law_1.01,0.25082879066467284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,balanced,0.19177599747975668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,power_law_1.01,0.12474240064620971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,balanced,0.2858720024426778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,power_law_1.01,0.25839359760284425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,power_law_1.01,0.1324735999107361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,power_law_1.01,0.2795711994171143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,power_law_1.01,0.13653119802474975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,balanced,0.3261813322703044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,power_law_1.01,0.27114880084991455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,power_law_1.01,0.13841919898986815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,balanced,2.536154588063558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,power_law_1.01,0.3084480047225952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,balanced,0.20653333266576132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,power_law_1.01,0.14855680465698243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,balanced,0.4533119996388753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,power_law_1.01,0.32992000579833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,balanced,0.21255467335383096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,power_law_1.01,0.15315840244293213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,power_law_1.01,0.374566388130188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,power_law_1.01,0.15802240371704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,balanced,0.5446079969406128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,power_law_1.01,0.4367936134338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,power_law_1.01,0.16186879873275756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,power_law_1.01,0.5279488086700439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,power_law_1.01,0.17185920476913452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,power_law_1.01,0.18339200019836427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,power_law_1.01,0.6246784210205079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,balanced,0.24713067213694254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,power_law_1.01,0.19946240186691283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,balanced,0.787397305170695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,power_law_1.01,0.8490176200866699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,power_law_1.01,0.23018240928649902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,balanced,0.30051199595133465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,power_law_1.01,1.0958720207214356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,power_law_1.01,0.25423359870910645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,balanced,0.3405706485112508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,power_law_1.01,1.5766271591186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,power_law_1.01,0.3025727987289429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,power_law_1.01,0.35946879386901853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,balanced,1.0696640014648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,balanced,0.4583359956741333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,power_law_1.01,2.0885120391845704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,power_law_1.01,0.4679423809051514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,balanced,4.0531307856241865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,power_law_1.01,2.5846912384033205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,balanced,0.535093347231547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,power_law_1.01,0.5725312232971191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,power_law_1.01,0.053625601530075076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,power_law_1.01,4.009203338623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,power_law_1.01,0.8016703605651856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,balanced,0.8018773396809896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,power_law_1.01,0.06399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,power_law_1.01,1.037337589263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,power_law_1.01,8.427206420898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,power_law_1.01,0.0683135986328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,power_law_1.01,1.523142433166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,balanced,1.5882399876912434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,balanced,0.978378693262736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,power_law_1.01,0.081523197889328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,power_law_1.01,2.0192127227783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,power_law_1.01,0.09505919814109802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,power_law_1.01,2.5235712051391603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,power_law_1.01,0.13034240007400513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,balanced,1.432480017344157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,power_law_1.01,0.1412287950515747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,power_law_1.01,4.048563385009766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,power_law_1.01,0.14529279470443726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,power_law_1.01,0.1545024037361145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,power_law_1.01,8.563884735107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,balanced,2.119978745778402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,power_law_1.01,0.1627519965171814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,balanced,1.8972320556640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,power_law_1.01,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,power_law_1.01,0.17920639514923095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,power_law_1.01,0.18421119451522827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,power_law_1.01,0.20346879959106445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,balanced,2.803546587626139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,power_law_1.01,0.21701760292053224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,balanced,2.671653429667155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,power_law_1.01,0.23277440071105956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,power_law_1.01,0.249619197845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,balanced,8.05625089009603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,power_law_1.01,0.30529279708862306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,balanced,3.706965446472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,power_law_1.01,0.3692095994949341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,1,power_law_1.2,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,power_law_1.01,0.4812352180480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,power_law_1.01,0.5917888164520264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,1,power_law_1.2,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,1,power_law_1.2,0.05865600109100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,power_law_1.01,0.8112319946289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,1,power_law_1.2,0.08028159737586975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,power_law_1.01,1.0406399726867677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,1,power_law_1.2,0.11390719413757325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,power_law_1.01,1.4957311630249024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,1,power_law_1.2,0.19014400243759155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,power_law_1.01,1.9441471099853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,1,power_law_1.2,0.2029952049255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,power_law_1.01,2.8575807571411134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,1,power_law_1.2,0.21298561096191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,balanced,4.616421381632487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,balanced,4.257402737935384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,1,power_law_1.2,0.21616640090942382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,power_law_1.01,3.7598079681396483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,1,power_law_1.2,0.2175679922103882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,1,power_law_1.2,0.22526719570159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,power_law_1.01,4.6621246337890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,1,power_law_1.2,0.23388800621032715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,1,power_law_1.2,0.2413503885269165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,power_law_1.01,7.376377868652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,1,power_law_1.2,0.2618367910385132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,1,power_law_1.2,0.2651968002319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,power_law_1.01,14.583161926269531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,1,power_law_1.2,0.2817471981048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,1,power_law_1.2,0.2779328107833862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,1,power_law_1.2,0.31409919261932373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,1,power_law_1.2,0.3329472064971924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,1,power_law_1.2,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,1,power_law_1.2,0.3863231897354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,1,power_law_1.2,0.03818239867687225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,1,power_law_1.2,0.440934419631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,1,power_law_1.2,0.5391168117523193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,1,power_law_1.2,0.04575999975204468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,1,power_law_1.2,0.6505343914031982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,1,power_law_1.2,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,1,power_law_1.2,0.8664447784423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,1,power_law_1.2,1.104313564300537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,1,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,balanced,7.311210632324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,1,power_law_1.2,1.5991935729980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,1,power_law_1.2,0.12174079418182374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,1,power_law_1.2,2.095039939880371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,1,power_law_1.2,0.12874239683151245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,1,power_law_1.2,2.572902488708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,1,power_law_1.2,0.13492480516433716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,1,power_law_1.2,0.1376255989074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,1,power_law_1.2,3.981497573852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,1,power_law_1.2,0.14309120178222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,1,power_law_1.2,0.14734079837799072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,1,power_law_1.2,8.466162872314452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,1,power_law_1.2,0.15456639528274535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,1,power_law_1.2,0.16236799955368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,1,power_law_1.2,0.16561280488967894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,1,power_law_1.2,0.17475199699401855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,1,power_law_1.2,0.18250880241394044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,1,power_law_1.2,0.20008959770202636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,1,power_law_1.2,0.2321984052658081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,balanced,8.011813481648764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,1,power_law_1.2,0.2556159973144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,1,power_law_1.2,0.3061311960220337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,1,power_law_1.2,0.364300799369812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,1,power_law_1.2,0.4707776069641113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,1,power_law_1.2,0.5817599773406983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,1,power_law_1.2,0.8064319610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,1,power_law_1.2,1.0452095985412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,1,power_law_1.2,1.5408512115478517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,1,power_law_1.2,2.052998352050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,1,power_law_1.2,2.550457572937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,1,power_law_1.2,4.074035263061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,balanced,14.456245422363281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,1,power_law_1.2,8.6185791015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,1,power_law_1.2,0.053907197713851926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,1,power_law_1.2,0.06261759996414185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,1,power_law_1.2,0.06893439888954163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,1,power_law_1.2,0.07893760204315185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,balanced,0.0848479966322581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,1,power_law_1.2,0.08862079977989197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,balanced,0.12408533692359924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,1,power_law_1.2,0.13294719457626342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,balanced,0.21909334262212118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,balanced,0.41433600584665936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,1,power_law_1.2,0.1461184024810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,balanced,0.7959307034810384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,1,power_law_1.2,0.14732799530029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,balanced,0.8080053329467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,1,power_law_1.2,0.15480320453643798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,balanced,0.8156426747639974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,1,power_law_1.2,0.16083199977874757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,balanced,0.8069067001342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,balanced,0.8090559641520182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,1,power_law_1.2,0.1686911940574646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,balanced,0.8096373081207275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,1,power_law_1.2,0.1779904007911682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,balanced,0.8133973280588785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,1,power_law_1.2,0.18442239761352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,balanced,0.8194666703542074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,1,power_law_1.2,0.2032320022583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,balanced,0.8232426643371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,balanced,0.8304639657338461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,balanced,0.059989333152770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,1,power_law_1.2,0.21875200271606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,balanced,0.8560427029927572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,balanced,0.8649280071258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,balanced,0.08147733410199483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,1,power_law_1.2,0.23303039073944093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,balanced,0.12838400403658548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,balanced,0.8972586790720621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,balanced,0.22937599817911783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,balanced,0.9150079886118571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,1,power_law_1.2,0.2502912044525146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,balanced,0.42260265350341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,balanced,0.42931199073791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,1,power_law_1.2,0.30595200061798095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,balanced,0.9660267035166422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,balanced,0.43162135283152264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,1,power_law_1.2,0.36764159202575686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,balanced,1.0039626757303874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,balanced,0.4351573387781779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,1,power_law_1.2,0.4830592155456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,balanced,0.43632535139719647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,balanced,1.0488959948221843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,1,power_law_1.2,0.5921728134155273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,balanced,0.4403146505355835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,balanced,0.44248533248901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,1,power_law_1.2,0.815180778503418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,balanced,0.44979198773701984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,1,power_law_1.2,1.0379903793334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,balanced,1.2191627025604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,balanced,0.4533760150273641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,1,power_law_1.2,1.4892288208007813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,balanced,0.4607253472010295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,1,power_law_1.2,1.9312576293945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,balanced,0.46980265776316327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,balanced,1.3167146841684978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,balanced,0.4750346740086873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,1,power_law_1.2,2.840652847290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,balanced,0.490229328473409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,1,power_law_1.2,3.7388607025146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,balanced,0.5152479807535807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,balanced,1.7173706690470378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,1,power_law_1.2,4.630553436279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,balanced,0.551088015238444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,balanced,0.6005653142929077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,1,power_law_1.2,7.291686248779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,balanced,0.6465919812520345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,balanced,2.2278186480204263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,1,power_law_1.2,14.44019775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,balanced,0.7806399663289388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,balanced,0.05997333427270254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,balanced,0.08246933420499165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,balanced,0.9018133481343588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,balanced,0.1341759959856669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,balanced,0.2350239952405294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,balanced,3.3590027491251626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,balanced,0.4297226667404175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,balanced,1.2248319784800212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,balanced,0.434928019841512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,balanced,0.4408533175786336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,balanced,0.4427573283513387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,balanced,0.4487146536509196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,balanced,1.5374186833699544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,balanced,0.45160531997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,balanced,0.459386666615804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.12346880435943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,balanced,0.46772801876068115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,balanced,4.2665707270304365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,balanced,0.4752533435821533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.09786880016326904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,balanced,0.48679999510447186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.01,0.17956479787826538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.01,0.2884160041809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.01,0.4365824222564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,balanced,2.206570625305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.01,0.6793791770935058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.01,0.7247871875762939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.07950720191001892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,balanced,0.5034079949061075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.01,0.7266496181488037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,balanced,0.5147413412729899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.01,0.752396821975708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.01,0.7603456020355225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.09187840223312378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.01,0.7843967914581299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.17155840396881103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.01,0.788479995727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.01,0.22447359561920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,balanced,5.358352025349935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.01,0.8088768005371094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.01,0.36188158988952634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,balanced,2.9276854197184243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.01,0.8578304290771485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.01,0.37249279022216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.01,0.8639039993286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.01,0.4001023769378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.01,0.8981887817382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.01,0.40378880500793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.01,0.944371223449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.01,0.4084799766540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.01,1.0632448196411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,balanced,0.5474933385848999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.01,0.42737278938293455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.01,1.0004672050476073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.01,1.1036031723022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.01,0.44488959312438964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,balanced,0.6012586752573649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.01,1.1942848205566405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.01,0.4518080234527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,balanced,0.6544586817423502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.01,1.5045951843261718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.01,0.44798078536987307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.01,1.7344127655029298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,balanced,0.7731413046518961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.01,0.48321919441223143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.01,2.3139007568359373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,balanced,3.697178522745768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.01,0.4928768157958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,2,power_law_1.2,0.12376320362091064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.01,2.9199039459228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,balanced,0.8771680196126302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.01,0.506105613708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,2,power_law_1.2,0.0794048011302948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.01,4.1404670715332035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.01,0.5611455917358399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,2,power_law_1.2,0.1813248038291931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.01,5.101766586303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,balanced,1.2759573459625244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,0.6020544052124024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,balanced,7.71131706237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,2,power_law_1.2,0.2584127902984619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,power_law_1.01,0.08867200016975403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,0.6706943988800049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.01,5.969388961791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,2,power_law_1.2,0.3443648099899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,0.733676815032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,power_law_1.01,0.08870400190353393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,balanced,1.462015946706136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.01,9.418041229248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,2,power_law_1.2,0.6670015811920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,0.8851648330688476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,power_law_1.01,0.1085055947303772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,2,power_law_1.2,0.7180543899536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,1.0503104209899903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,power_law_1.01,0.1602560043334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.01,17.403750610351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,2,power_law_1.2,0.7514688014984131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,power_law_1.01,0.23149440288543702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,1.5037055969238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,balanced,2.1280852953592935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,2,power_law_1.2,0.7630335807800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,power_law_1.01,0.35749120712280275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,1.835807991027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,2,power_law_1.2,0.7956031799316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,power_law_1.01,0.38103680610656737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,2.6418432235717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,2,power_law_1.2,0.7883135795593261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,power_law_1.01,0.3999488115310669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,balanced,5.380767822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,3.3019710540771485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,2,power_law_1.2,0.8271552085876465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,power_law_1.01,0.4035967826843262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,balanced,2.836602528889974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,2,power_law_1.2,0.8322688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,power_law_1.01,0.4181951999664307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.01,4.088787078857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,2,power_law_1.2,0.8161343574523926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,power_law_1.01,0.4635647773742676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,2,power_law_1.2,0.9055551528930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.01,5.828031921386719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,power_law_1.01,0.4709440231323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,2,power_law_1.2,0.91909761428833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,power_law_1.01,0.5014272212982178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,2,power_law_1.2,0.9729920387268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.01,12.836370849609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,power_law_1.01,0.5223040103912353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,2,power_law_1.2,1.05796480178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,balanced,4.207994778951009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,2,power_law_1.2,0.999027156829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,2,power_law_1.2,1.1242112159729003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,power_law_1.01,0.5290431976318359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,2,power_law_1.2,1.229478359222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,power_law_1.01,0.550105619430542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,2,power_law_1.2,1.5093503952026368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,2,power_law_1.2,1.7741056442260743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,power_law_1.01,0.5616064071655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,power_law_1.01,0.6595392227172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,2,power_law_1.2,2.5288000106811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,balanced,5.68284289042155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.01,0.7652544021606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,2,power_law_1.2,3.1585151672363283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.01,0.9032256126403808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,2,power_law_1.2,4.498969650268554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,balanced,15.083343505859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.01,1.095423984527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,2,power_law_1.2,5.260927963256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.01,1.4800704002380372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,2,power_law_1.2,6.816441345214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.01,1.7570816040039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.01,2.5892608642578123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,2,power_law_1.2,9.203231811523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.01,3.4646526336669923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,balanced,7.090410868326823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.01,5.054694366455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,2,power_law_1.2,17.627212524414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,balanced,11.209354400634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.01,6.717222595214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,power_law_1.01,8.024486541748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,power_law_1.01,12.260678100585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.07831040024757385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.07048959732055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,power_law_1.01,26.240927124023436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.09994239807128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.1453760027885437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.20793600082397462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,balanced,11.322437286376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,2,power_law_1.2,0.3508352041244507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,2,power_law_1.2,0.40161919593811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,2,power_law_1.2,0.3931071996688843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,2,power_law_1.2,0.40523519515991213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,2,power_law_1.2,0.4205887794494629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,2,power_law_1.2,0.4444608211517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,2,power_law_1.2,0.43683838844299316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,2,power_law_1.2,0.456441593170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,2,power_law_1.2,0.47609601020812986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,2,power_law_1.2,0.5028160095214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,2,power_law_1.2,0.5193408012390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,2,power_law_1.2,0.5075712203979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,2,power_law_1.2,0.5800384044647217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,0.5929664134979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,0.6945151805877685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,0.7717631816864013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,0.9640512466430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,1.124019241333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,1.4544320106506348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,1.953446388244629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,3.1253631591796873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,balanced,22.780052185058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,3.803014373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,2,power_law_1.2,4.599846267700196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,2,power_law_1.2,7.060018920898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,2,power_law_1.2,13.775021362304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,2,power_law_1.2,0.08823680281639099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,2,power_law_1.2,0.06823679804801941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,2,power_law_1.2,0.101363205909729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,2,power_law_1.2,0.15193599462509155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,2,power_law_1.2,0.19763840436935426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,2,power_law_1.2,0.3619584083557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,2,power_law_1.2,0.39669759273529054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,2,power_law_1.2,0.4269567966461182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,2,power_law_1.2,0.434335994720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,2,power_law_1.2,0.4222911834716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,2,power_law_1.2,0.46082558631896975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,2,power_law_1.2,0.4777535915374756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,2,power_law_1.2,0.5047616004943848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,2,power_law_1.2,0.5402304172515869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,balanced,0.08502933382987976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,2,power_law_1.2,0.5327807903289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,balanced,0.12505599856376648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,2,power_law_1.2,0.5614208221435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,balanced,0.22350933154424033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,balanced,0.4212799866994222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,balanced,0.8015893300374349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,2,power_law_1.2,0.5725887775421142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,balanced,0.8076746463775635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,2,power_law_1.2,0.6867263793945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,balanced,0.06029866635799408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,balanced,0.8090240160624186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.2,0.7845888137817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,balanced,0.8169439633687338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,balanced,0.08109333117802937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.2,0.928486442565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,balanced,0.12986666957537332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.2,1.1354751586914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,balanced,0.8200000127156576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.2,1.5252032279968262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,balanced,0.2299893299738566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.2,1.957881546020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,balanced,0.42934401830037433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,balanced,0.8212587038675944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.2,2.7727615356445314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,balanced,0.44047999382019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,balanced,0.8281333446502686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.2,3.593958282470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,balanced,0.43878400325775146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,balanced,0.8387146790822347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.2,5.320473480224609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,balanced,0.44154131412506104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,balanced,0.4463733434677124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,balanced,0.8444266319274902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.2,6.92449951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,balanced,0.44940801461537677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,balanced,0.8540053367614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,2,power_law_1.2,9.689087677001954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.07437440156936645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,balanced,0.45557332038879395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,balanced,0.45954668521881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,balanced,0.8826826413472494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.08865280151367187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,2,power_law_1.2,14.327949523925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,balanced,0.46857066949208576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.1674239993095398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,balanced,0.8940906524658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,balanced,0.4792853196461995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.2872191905975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,balanced,0.9087039629618326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,2,power_law_1.2,27.508551025390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,balanced,0.4917173385620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.38202879428863523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,balanced,0.9533119996388754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,balanced,0.5007786750793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.6805568218231202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,balanced,0.07508799930413564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.7056575775146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,balanced,0.5293013254801432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,balanced,1.0225333372751872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,balanced,0.0940106709798177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.7421887874603271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,balanced,0.1411893367767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,balanced,0.5761866569519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,balanced,1.098352034886678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,balanced,0.2421226700146993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.7490816116333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,balanced,0.6062346696853638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,balanced,0.43182400862375897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.7777919769287109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.055232000350952146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,balanced,0.4402453502019246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,balanced,0.6853919823964437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,balanced,1.172869364420573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.7864831924438477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,balanced,0.44784533977508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.06311039924621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,balanced,0.4524213473002116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.8043071746826171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.11278719902038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,balanced,0.7758239905039469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,balanced,0.45898667971293133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,balanced,1.3666826883951824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.15991679430007935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.810035228729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,balanced,0.46726401646931964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.21560959815979003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,balanced,0.971338669459025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.8686847686767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,balanced,0.4758666753768921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.01,0.3560319900512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,balanced,0.4879466692606608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,balanced,1.541935920715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.01,0.3821824073791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.8799039840698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,balanced,0.500495990117391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.01,0.3974720001220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,balanced,1.1531893412272136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,balanced,0.5174346764882406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.01,0.40998401641845705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.918489646911621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.01,0.42346878051757814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.9376768112182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.01,0.4341184139251709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,balanced,2.0380959510803223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.01,0.45639681816101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.01,1.0394368171691895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,balanced,1.5842986106872559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.01,0.47205119132995604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.01,0.4697984218597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.01,1.0388287544250487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,balanced,0.5400799910227457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.01,0.49309439659118653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.01,1.115775966644287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.01,0.5146624088287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,balanced,0.5624373356501261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.01,0.5269375801086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.01,1.2239680290222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,balanced,2.5696266492207847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.01,0.5899456024169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,balanced,2.040005366007487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.01,1.4994303703308105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,0.6335360050201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.7875839233398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,0.7188032150268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.01,2.4118911743164064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,0.8127424240112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,1.0197952270507813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.01,3.05545597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,balanced,0.62937064965566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,1.248192024230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.01,4.287648010253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,1.7302400588989257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,balanced,3.69708251953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,balanced,0.7289600372314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,balanced,2.978010813395182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,2.1684736251831054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.01,5.295846557617187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,balanced,0.8012053171793619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,3.120595169067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.01,6.548652648925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,balanced,1.0140693187713623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,4.048563385009766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.01,4.9302528381347654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,balanced,1.1840319633483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.01,9.627481842041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.01,7.672019195556641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,balanced,1.800597349802653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.01,19.932672119140626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,balanced,4.869061470031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,balanced,4.100495974222819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.01,16.38814697265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,balanced,2.1481226285298667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.07427840232849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.08227840065956116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,power_law_1.01,0.07816320061683654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.1606783986091614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,balanced,3.1442559560139975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,power_law_1.01,0.07870079874992371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.2569727897644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,power_law_1.01,0.1242751955986023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.3643775939941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,power_law_1.01,0.17493120431900025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.672870397567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,balanced,5.0512692133585615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,balanced,6.0533707936604815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,power_law_1.01,0.23636479377746583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,balanced,4.137333234151204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.7379456043243409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,power_law_1.01,0.3680959939956665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.7593855857849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,power_law_1.01,0.38806400299072263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,power_law_1.01,0.4147647857666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.7959743976593018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,power_law_1.01,0.42753920555114744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.7945216178894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,power_law_1.01,0.4517824172973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.8199551582336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,power_law_1.01,0.4670015811920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,balanced,6.261615753173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.8188223838806152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,power_law_1.01,0.4976960182189941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.8429696083068847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,power_law_1.01,0.521779203414917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.9124608039855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,power_law_1.01,0.562713623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.9466496467590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.984716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,power_law_1.01,0.5586559772491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.9692223548889161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,power_law_1.01,0.5994880199432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,1,power_law_1.2,1.0709568023681642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,balanced,7.766165415445964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,balanced,9.449109395345053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,balanced,8.357583999633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,1,power_law_1.2,1.0630016326904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,power_law_1.01,0.6562111854553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,1,power_law_1.2,1.1493887901306152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,power_law_1.01,0.7796480178833007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,1,power_law_1.2,1.2998656272888183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.01,0.9009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,1,power_law_1.2,1.6296255111694335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.01,1.0895615577697755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.9121023178100587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.01,1.337235164642334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,1,power_law_1.2,2.5128320693969726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,1,power_law_1.2,3.1694208145141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.01,1.818547248840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,1,power_law_1.2,4.571680068969727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.01,2.3069055557250975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,balanced,10.50600560506185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.01,3.3015552520751954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,1,power_law_1.2,5.410105514526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.01,4.301023864746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,1,power_law_1.2,6.56842269897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.01,6.299084854125977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,1,power_law_1.2,9.811090850830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.01,8.251686096191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,power_law_1.2,20.498777770996092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.01,10.316121673583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.06229760050773621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.09664000272750854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,power_law_1.01,16.506623840332033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.18451839685440063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,1,power_law_1.2,0.3635263919830322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,1,power_law_1.2,0.37494399547576907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,1,power_law_1.2,0.4137087821960449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,power_law_1.01,32.87724914550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,1,power_law_1.2,0.42232961654663087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,balanced,16.52066167195638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,1,power_law_1.2,0.44117121696472167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,1,power_law_1.2,0.4625279903411865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,1,power_law_1.2,0.4746431827545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,1,power_law_1.2,0.496563196182251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,balanced,15.495984395345053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,1,power_law_1.2,0.4971968173980713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,1,balanced,19.50658671061198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,1,power_law_1.2,0.5065023899078369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,1,power_law_1.2,0.5330304145812989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,1,power_law_1.2,0.5426559925079346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,1,power_law_1.2,0.6067647933959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,0.6356736183166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,0.7365439891815185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,0.8351424217224122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,1.0455103874206544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,1.2812607765197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,1.733964729309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,2.207084846496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,3.1267135620117186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,4.015558242797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,1,power_law_1.2,4.940806579589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,1,power_law_1.2,7.725151824951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,1,power_law_1.2,16.256658935546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,balanced,34.42121124267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,balanced,0.18305067221323648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,balanced,0.28755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,balanced,0.5269920031229655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,1,power_law_1.2,0.07806079983711242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,balanced,1.0124639670054119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,balanced,1.9773707389831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,1,power_law_1.2,0.08364800214767457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,balanced,2.4666345914204917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,1,power_law_1.2,0.10467840433120727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,balanced,2.4746079444885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,1,power_law_1.2,0.15421439409255983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,balanced,2.4848853747049966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,1,power_law_1.2,0.19612159729003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,1,power_law_1.2,0.3804480075836182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,balanced,2.493504047393799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,1,power_law_1.2,0.39650559425354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,balanced,2.500218709309896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,1,power_law_1.2,0.4143104076385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,balanced,2.503023942311605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,1,power_law_1.2,0.44267520904541013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,1,power_law_1.2,0.4582528114318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,balanced,2.528879960378011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,1,power_law_1.2,0.47739520072937014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,balanced,2.5367466608683267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,1,power_law_1.2,0.5023615837097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,1,power_law_1.2,0.530131196975708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,balanced,2.5590133666992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,1,power_law_1.2,0.5705984115600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,balanced,2.5838987032572427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,balanced,2.598741372426351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,1,power_law_1.2,0.5712895870208741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,balanced,2.6378560066223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,1,power_law_1.2,0.6020480155944824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,balanced,2.683274586995443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,balanced,2.7553014755249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,1,power_law_1.2,0.6571519851684571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,1,power_law_1.2,0.7803647994995118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,balanced,2.967754681905111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.2,0.9041088104248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.2,1.10763521194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,balanced,3.020384152730306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.2,1.3459199905395507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.2,1.84769287109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,balanced,5.376373291015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.2,2.3280511856079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.2,3.3347904205322267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.2,4.326579284667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,balanced,3.407072067260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.2,6.312793731689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,balanced,0.11572266618410747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.2,8.283744049072265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,balanced,5.993237177530925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,balanced,0.1686026652654012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,balanced,0.293178657690684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.2,10.267935943603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,balanced,0.5468853314717611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,balanced,1.0500213305155437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,balanced,1.3082239627838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,1,power_law_1.2,16.397010803222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,balanced,1.3212587038675945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,balanced,5.791968027750651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,balanced,1.3161866664886475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,balanced,1.3226133187611897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,balanced,1.3282240231831868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,1,power_law_1.2,32.28997802734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,balanced,1.3350292841593425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,balanced,1.3391626675923665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,balanced,1.355493386586507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,balanced,7.431695938110352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,balanced,1.3692320187886555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,balanced,1.3852373758951824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,balanced,1.4007573127746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,balanced,1.43886931737264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,balanced,0.12294399738311768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,balanced,1.4614559809366863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,balanced,0.17268800735473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.01,0.2883392095565796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.01,0.1752128005027771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,balanced,0.3113119999567668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,balanced,1.5035840670267742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.01,0.4618368148803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,balanced,0.5308266480763754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.01,0.24161279201507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,balanced,10.467098871866861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,balanced,1.976901372273763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,balanced,1.007034699122111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.01,0.43451519012451173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.01,0.22734079360961915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,balanced,1.2512799898783367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.01,0.4203904151916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.01,0.6392064094543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,balanced,1.6595039367675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,balanced,1.259440024693807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.01,0.5444736003875732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.01,1.0871487617492677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,balanced,1.2670239607493083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.01,0.9488832473754882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,balanced,2.716597239176432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.01,1.8287424087524413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,balanced,1.2741173108418782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.01,1.0599616050720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.01,1.9059520721435548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,balanced,1.2819146315256755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,balanced,2.063418706258138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.01,1.106655979156494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,balanced,1.2943840026855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.01,2.0480064392089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.01,1.1397631645202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,balanced,1.3089653650919597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.01,2.133772850036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.01,1.079430389404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,balanced,1.3219679991404216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,balanced,11.281915028889975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,balanced,3.3839734395345054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.01,2.2304000854492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,balanced,1.3438612620035808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.01,1.236473560333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.01,2.2705408096313477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,balanced,1.3698773384094238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.01,1.3030079841613769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.01,2.500543975830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.01,1.3871871948242187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,power_law_1.01,0.18226560354232788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.01,2.503545570373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,balanced,3.5632425944010415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.01,1.3325887680053712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,power_law_1.01,0.27325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.01,2.4206592559814455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,power_law_1.01,0.22322559356689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.01,1.4466496467590333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,balanced,1.3913866678873699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.01,2.6657472610473634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,power_law_1.01,0.41329278945922854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.01,1.4851008415222169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.01,2.656358337402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,power_law_1.01,0.5896448135375977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.01,1.3899264335632324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,2,power_law_1.2,0.2874943971633911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.01,2.8489023208618165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,power_law_1.01,0.9514047622680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.01,1.5145279884338378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,balanced,5.198959986368815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,2,power_law_1.2,0.2050879955291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,power_law_1.01,1.0582592010498046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.01,3.2027584075927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.01,1.6499135971069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,balanced,1.4457227389017742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,power_law_1.01,1.0783679962158204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,2,power_law_1.2,0.3512768030166626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.01,3.1719871520996095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.01,1.8978431701660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,power_law_1.01,1.0776639938354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,2,power_law_1.2,0.6407104015350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.01,3.704121780395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.01,2.08536319732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,power_law_1.01,1.1786687850952149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,balanced,18.8176752726237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.01,2.522694396972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.01,4.200083160400391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,2,power_law_1.2,0.9997440338134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,power_law_1.01,1.2577919960021973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.01,2.654310417175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,2,power_law_1.2,1.7724224090576173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.01,5.241132736206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,power_law_1.01,1.3239168167114257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,balanced,8.879573186238607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,2,power_law_1.2,1.8937343597412108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.01,3.4272129058837892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,power_law_1.01,1.39552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.01,4.793913650512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,2,power_law_1.2,2.1008256912231444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,power_law_1.01,1.5260992050170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,balanced,1.5624426205952961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.01,4.177926254272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.01,5.916499328613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,2,power_law_1.2,2.217568016052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,power_law_1.01,1.6774784088134767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,balanced,1.655402660369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.01,5.606950378417968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.01,7.135257720947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,2,power_law_1.2,2.3385663986206056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,balanced,1.8345759709676106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.01,7.658399963378907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,2,power_law_1.2,2.3509567260742186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.01,10.206111907958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,power_law_1.01,1.5536512374877929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,2,power_law_1.2,2.4925312042236327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,balanced,2.0035093625386557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.01,9.928652954101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,2,power_law_1.2,2.585536003112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.01,13.866610717773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,power_law_1.01,1.7352447509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,2,power_law_1.2,2.5024320602416994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,balanced,9.227557500203451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,balanced,2.8803892135620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.01,13.891769409179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.01,17.756556701660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,2,power_law_1.2,2.7532800674438476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,2,power_law_1.2,2.764620780944824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,power_law_1.01,1.7349632263183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,balanced,3.242447853088379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,2,power_law_1.2,3.0240703582763673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.01,24.414906311035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.01,23.313145446777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.01,1.971628761291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,2,power_law_1.2,3.2883777618408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.01,2.1576000213623048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,2,power_law_1.2,3.355263900756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,balanced,4.943765322367351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.01,2.4863487243652345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,2,power_law_1.2,3.8208896636962892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.01,3.1446016311645506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.01,47.588461303710936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,2,power_law_1.2,4.525555038452149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.01,4.221855926513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,2,power_law_1.2,5.502463912963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,balanced,6.849285125732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.01,5.646585464477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,2,power_law_1.2,5.1754814147949215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.01,7.231180572509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,2,power_law_1.2,6.493753814697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,balanced,13.137120564778646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.01,10.413420867919921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,2,power_law_1.2,7.976627349853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,balanced,38.92405446370443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,2,power_law_1.2,11.555487823486327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.01,14.810758972167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,balanced,9.912815729777018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,2,power_law_1.2,15.839340209960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,power_law_1.01,17.12718048095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,2,power_law_1.2,19.339935302734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,power_law_1.01,32.24806518554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,2,power_law_1.2,26.207565307617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,balanced,13.833450317382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.17490559816360474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.1360703945159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,2,power_law_1.2,0.2315135955810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,power_law_1.01,66.54425048828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,2,power_law_1.2,45.693426513671874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,2,power_law_1.2,0.3575295925140381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,2,power_law_1.2,0.49129600524902345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,2,power_law_1.2,0.9233152389526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,2,power_law_1.2,1.0741120338439942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,2,power_law_1.2,1.1028351783752441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,2,power_law_1.2,1.1470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,2,power_law_1.2,1.1584256172180176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,balanced,16.74517822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,2,power_law_1.2,1.2825471878051757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,2,power_law_1.2,1.329683208465576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,2,power_law_1.2,1.4219776153564454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,2,power_law_1.2,1.3531455993652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,2,power_law_1.2,1.4566335678100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,balanced,24.36029815673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,2,power_law_1.2,1.5255104064941407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,2,power_law_1.2,1.411628818511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,2,power_law_1.2,1.5805888175964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,1.6700031280517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,2.023187255859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,2.1453887939453127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,2.716147232055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,2.7475967407226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,balanced,28.410016377766926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,3.457484817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,4.418764877319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,5.595347213745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,8.5342529296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,2,power_law_1.2,9.407718658447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,2,power_law_1.2,14.874649047851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,2,power_law_1.2,25.964767456054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,balanced,63.30353291829427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,2,power_law_1.2,0.183078396320343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,2,power_law_1.2,0.17037440538406373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,2,power_law_1.2,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,2,power_law_1.2,0.3725120067596436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,2,power_law_1.2,0.4568192005157471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,2,power_law_1.2,0.957049560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,balanced,0.1583093305428823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,2,power_law_1.2,1.034982395172119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,2,power_law_1.2,1.0610176086425782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,balanced,0.28446932633717853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,2,power_law_1.2,1.1417599678039552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,balanced,0.5302240053812662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,2,power_law_1.2,1.242739200592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,balanced,1.0051093101501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,balanced,1.9755573272705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,2,power_law_1.2,1.3086079597473144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,balanced,2.4798453648885093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,2,power_law_1.2,1.3888319969177245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,balanced,0.11569600303967793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,2,power_law_1.2,1.4679360389709473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,balanced,2.481930732727051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,balanced,0.16622400283813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,2,power_law_1.2,1.5684351921081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,balanced,2.4941652615865073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,balanced,2.4978507359822593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,2,power_law_1.2,1.6810815811157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,balanced,0.2869653304417928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,balanced,2.503925323486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,balanced,0.5353279908498129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,balanced,2.5200160344441733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,balanced,1.028656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,balanced,2.527594725290934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,2,power_law_1.2,1.6272384643554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,balanced,1.2820746898651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,balanced,2.543440024058024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,balanced,1.2897546291351318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,balanced,2.5518080393473306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,balanced,1.2911893526713054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,2,power_law_1.2,1.7344575881958009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,balanced,2.576373259226481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,balanced,1.3023467063903809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,balanced,2.670570691426595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,balanced,1.3029599984486897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,balanced,1.3256800174713135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,balanced,2.711125373840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,2,power_law_1.2,1.7908031463623046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,balanced,1.3239359855651855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,balanced,2.791989326477051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,balanced,1.3482507069905598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.2,2.0403392791748045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,balanced,0.14011733730634054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,balanced,1.3590453465779622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,balanced,2.839146614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.2,2.1394111633300783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,balanced,0.1851466695467631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,balanced,1.3870666821797688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.2,2.502022361755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,balanced,3.7248799006144204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.1757248044013977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,balanced,0.3232480088869731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,balanced,1.4091733296712239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.2,3.4842174530029295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,balanced,0.5460373163223267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,balanced,3.1214027404785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.25418241024017335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,balanced,1.4345547358194988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.2,3.984275054931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,balanced,1.0269386768341064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.4065408229827881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,balanced,1.2757813135782878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,balanced,1.7509652773539226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.2,5.526105499267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,balanced,4.663802782694499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,balanced,1.285797357559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.7311808109283447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,balanced,1.2981493473052979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,balanced,1.567072073618571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.2,7.650246429443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.9932479858398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,balanced,1.311077356338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.11600639820098876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,balanced,3.757040023803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,balanced,1.6717119216918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.01,1.828019142150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.2,10.894585418701173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,balanced,1.3181866804758708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.1476863980293274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.01,1.9039936065673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,balanced,1.3373066584269206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,balanced,1.8174452781677246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.01,0.22001280784606933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.2,16.13477783203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.01,2.117990493774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,balanced,1.3598240216573079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,balanced,6.1289011637369795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.01,0.3775360107421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,balanced,1.374853293100993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.01,2.115488052368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,balanced,2.542362689971924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.01,0.5637311935424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,2,power_law_1.2,21.87986602783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,balanced,1.413274606068929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.01,2.118976020812988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.01,0.9958335876464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,balanced,1.4582239786783855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.01,1.0616255760192872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.01,2.2095104217529298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,balanced,2.351184050242106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,balanced,6.47494379679362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.01,1.098316764831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.01,2.347500801086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,2,power_law_1.2,32.325497436523435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.01,1.1047167778015137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.01,2.3235136032104493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.01,1.163430404663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.01,2.483571243286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,balanced,3.660437266031901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,balanced,1.501167933146159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.01,1.2235775947570802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.01,2.541375923156738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.01,1.2483136177062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.01,1.2975232124328613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.01,2.6833791732788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,balanced,9.521296183268229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,2,power_law_1.2,74.66463012695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.01,1.3206208229064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.01,2.7038591384887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,balanced,4.032586733500163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.01,1.3577728271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,balanced,1.5716053644816081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.01,2.9187456130981446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.01,1.4088895797729493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.01,3.462201690673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.01,1.4604928016662597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.01,4.095731353759765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.01,1.5630144119262694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.01,4.2857921600341795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,1.651737594604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,balanced,5.530127843221028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,balanced,11.353771209716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,1.890105628967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.01,5.5722496032714846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,2.1307519912719726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.01,4.721734237670899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,balanced,1.7323360443115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,power_law_1.01,0.1401471972465515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,2.571219253540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,power_law_1.01,0.17685760259628297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.01,5.901875305175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,balanced,1.8684320449829102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,2.9360319137573243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,power_law_1.01,0.2353663921356201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,power_law_1.01,0.38957440853118896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.01,7.063442993164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,3.7524032592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,power_law_1.01,0.5281216144561768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,balanced,2.1658612887064614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,power_law_1.01,0.9485695838928223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,4.504204940795899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.01,9.548063659667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,power_law_1.01,1.0588800430297851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,balanced,7.546021143595378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,balanced,2.4562719662984214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,power_law_1.01,1.0744064331054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,6.241171264648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,power_law_1.01,1.1385600090026855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.01,13.933619689941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,balanced,12.2401974995931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,power_law_1.01,1.170150375366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,8.373043060302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,balanced,3.641530672709147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,power_law_1.01,1.2479743957519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.01,18.900314331054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,power_law_1.01,1.3291711807250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.01,10.38007049560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,power_law_1.01,1.422003173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,balanced,4.341349283854167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,power_law_1.01,1.5042367935180665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.17562240362167358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.01,21.03614044189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.01,15.797319030761718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,power_law_1.01,1.6499391555786134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.19514880180358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.34716799259185793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,balanced,9.003909428914389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.629414415359497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,power_law_1.01,1.6156991958618163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,balanced,6.578421274820964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.9392255783081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.01,26.386862182617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.01,45.599935913085936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,1,power_law_1.2,1.78222713470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,1,power_law_1.2,2.047161674499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,power_law_1.01,1.7044288635253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,1,power_law_1.2,2.1519487380981444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,1,power_law_1.2,2.13753604888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,balanced,8.83633041381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,1,power_law_1.2,2.216991996765137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,1,power_law_1.2,2.276095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,power_law_1.01,1.8662591934204102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,1,power_law_1.2,2.4222335815429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.01,2.100275230407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,balanced,22.990933736165363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,1,power_law_1.2,2.3755775451660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.01,2.3613887786865235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,1,power_law_1.2,2.4741823196411135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.01,2.7661632537841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,1,power_law_1.2,2.6083839416503904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.01,3.6077632904052734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,balanced,12.650032043457031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,1,power_law_1.2,2.698393630981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,1,power_law_1.2,2.8015935897827147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.01,4.529439926147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,1,power_law_1.2,3.0823808670043946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,balanced,16.196139017740887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.01,6.39738883972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,1,power_law_1.2,3.5914752960205076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.01,8.288217926025391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,1,power_law_1.2,4.2778881072998045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,1,power_law_1.2,4.493753433227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.01,12.31036148071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,1,power_law_1.2,5.568991851806641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,balanced,17.84115727742513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,1,power_law_1.2,4.833248138427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.01,16.295225524902342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,1,power_law_1.2,5.9830272674560545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.01,20.199980163574217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,1,power_law_1.2,7.238124847412109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,1,power_law_1.2,9.549305725097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,power_law_1.01,33.092864990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,1,power_law_1.2,14.782156372070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,1,power_law_1.2,18.100274658203126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,balanced,20.932783762613933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,1,power_law_1.2,21.06829376220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,power_law_1.01,67.00863647460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,power_law_1.2,44.337042236328124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,1,balanced,51.54291788736979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,balanced,27.47205861409505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,balanced,35.71368408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.10769920349121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.11779839992523193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,1,power_law_1.2,0.19879039525985717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,1,power_law_1.2,0.3385983943939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,1,power_law_1.2,0.46411519050598143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,1,power_law_1.2,0.9493760108947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,1,power_law_1.2,1.0504511833190917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,1,power_law_1.2,1.0744256019592284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,1,power_law_1.2,1.1330559730529786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,1,power_law_1.2,1.1655808448791505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,1,power_law_1.2,1.2381952285766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,1,power_law_1.2,1.2769920349121093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,1,power_law_1.2,1.3108736038208009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,1,power_law_1.2,1.3446080207824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,1,power_law_1.2,1.403878402709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,1,power_law_1.2,1.425984001159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,1,power_law_1.2,1.4745471954345704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,1,power_law_1.2,1.5933247566223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,balanced,73.22249348958333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,1.6915712356567383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,1.928825569152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,2.079136085510254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,balanced,0.17725332578023276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,2.4980224609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,balanced,0.26648000876108807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,1,power_law_1.2,0.1391808032989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,2.9211135864257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,balanced,0.5098079840342203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,balanced,0.9551253318786621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,1,power_law_1.2,0.15281280279159545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,3.7054271697998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,1,power_law_1.2,0.23303039073944093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,balanced,1.9088853200276692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,4.579014587402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,1,power_law_1.2,0.3669888019561768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,balanced,3.7983201344807944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,1,power_law_1.2,0.5059711933135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,6.270169448852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,1,power_law_1.2,0.9636735916137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,balanced,5.674191792805989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,1,power_law_1.2,1.0480575561523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,8.56561279296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,balanced,5.652751922607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,1,power_law_1.2,1.0580608367919921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,1,power_law_1.2,1.1662528038024902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,balanced,5.6953277587890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,1,power_law_1.2,10.50189437866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,1,power_law_1.2,1.2537856101989746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,balanced,5.7010345458984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,1,power_law_1.2,1.3081088066101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,balanced,5.559994379679362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,1,power_law_1.2,1.3988991737365724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,1,power_law_1.2,15.952557373046876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,balanced,5.596421559651692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,1,power_law_1.2,1.4580863952636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,1,power_law_1.2,1.5734784126281738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,balanced,5.612949371337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,1,power_law_1.2,1.7047296524047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,balanced,5.6044158935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,1,power_law_1.2,25.792056274414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,balanced,5.670965194702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,1,power_law_1.2,1.6695167541503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,balanced,5.678586959838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,balanced,5.713935852050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,1,power_law_1.2,1.7863679885864259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,balanced,5.778720219930013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,balanced,6.045045216878255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,1,power_law_1.2,1.8964672088623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.2,2.1454463958740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,balanced,6.2186024983723955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.2,2.392902374267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,balanced,6.250730514526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.2,2.837824058532715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,balanced,0.11051733295122783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.2,3.7124095916748048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,balanced,0.15727466344833374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,balanced,6.536640167236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,balanced,0.27057600021362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.2,4.611660766601562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,balanced,0.5014293193817139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,balanced,0.9557653268178304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.2,6.4603523254394535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,balanced,6.910341262817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,balanced,1.8690773646036785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,balanced,2.781205177307129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.2,8.367769622802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,balanced,2.7850612004597983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,balanced,2.793898582458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,balanced,7.277418772379558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.2,12.12750701904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,balanced,2.8080212275187173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,balanced,0.13989866773287454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.01,0.156550395488739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.01,0.29319679737091064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,balanced,2.812586784362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,balanced,0.18245333433151245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.2,16.126605224609374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.01,0.48853120803833006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,balanced,2.812938690185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.01,0.2698303937911987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,balanced,0.3280959924062093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,balanced,0.512608011563619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,balanced,2.855621337890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.01,0.9383808135986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,balanced,7.6481068929036455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.01,0.49647998809814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,balanced,0.9534880320231119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.2,20.07861785888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,balanced,2.8421653111775718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.01,0.3497024059295654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.01,0.7029056072235107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,balanced,1.8415946960449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,balanced,2.864037195841471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.01,0.7423808097839355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.01,1.4415679931640626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,balanced,2.719615936279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,balanced,2.8896268208821616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.01,1.0557951927185059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.01,2.2160768508911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,balanced,2.72708797454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,1,power_law_1.2,32.44035339355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,balanced,2.9191999435424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.01,1.303724765777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,balanced,2.7355521519978843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.01,2.6049728393554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,balanced,8.244453430175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,balanced,2.994314511617025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,balanced,2.743376096089681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.01,1.76561279296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.01,3.565407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,balanced,2.762159983317057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,balanced,3.053167978922526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.01,1.828927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.01,3.5270526885986326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,balanced,2.777887980143229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,balanced,3.1744372049967446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.01,1.8975103378295899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,1,power_law_1.2,66.01309204101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,balanced,2.790138562520345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.01,3.6631999969482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,balanced,3.2448161443074546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.01,2.0012287139892577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,balanced,2.815434773763021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.01,3.7060928344726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.01,2.0972288131713865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,balanced,2.8527199427286782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,balanced,3.427994728088379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.01,3.956095886230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.01,2.149702453613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,balanced,2.8792266845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,balanced,15.668485005696615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.01,4.13438720703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.01,2.3839359283447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,balanced,2.9387359619140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,balanced,3.6931838989257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.01,2.4709888458251954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.01,4.188556671142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,balanced,3.0642401377360025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.01,2.5840768814086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.01,4.43438720703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.01,2.525779151916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.01,4.517574310302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,balanced,4.045189221700032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.01,2.8417535781860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.01,4.571590423583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.01,2.8270847320556642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,balanced,3.166261355082194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.01,4.933561706542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.01,3.1968191146850584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,balanced,4.456111907958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,balanced,20.941722869873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.01,5.881235122680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.01,3.5357376098632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.01,6.896211242675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.01,4.28616943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.01,4.270374298095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.01,7.453056335449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.01,5.435078430175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,balanced,3.411866823832194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,balanced,5.1353333791097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.01,9.365286254882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.01,5.609785461425782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,balanced,3.6196425755818686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.01,8.067552185058593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.01,6.734413146972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,balanced,3.970149358113607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.01,10.08713607788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.01,8.995027160644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.01,9.448153686523437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.01,10.103123474121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,balanced,4.389781316121419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,balanced,6.948650360107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,power_law_1.01,0.2035072088241577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,power_law_1.01,0.3146687984466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.01,12.409024047851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.01,15.417823791503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,balanced,20.8931147257487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,power_law_1.01,0.5339968204498291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,balanced,5.139376004536946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,power_law_1.01,0.36165120601654055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,power_law_1.01,0.6997568130493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.01,19.091949462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.01,26.7371337890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,power_law_1.01,1.1017087936401366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,power_law_1.01,1.3170687675476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,power_law_1.01,1.6508991241455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,balanced,7.608992258707683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.01,24.797817993164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,power_law_1.01,1.834841537475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,power_law_1.01,1.918297576904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,balanced,8.755119959513346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,power_law_1.01,2.035487937927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,power_law_1.01,2.0619712829589845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.01,30.307192993164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,power_law_1.01,2.1635135650634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,2,power_law_1.2,0.2931519985198975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,power_law_1.01,2.3524736404418944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,balanced,9.569973627726236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,2,power_law_1.2,0.48839678764343264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,power_law_1.01,2.5642368316650392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,2,power_law_1.2,0.5420351982116699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,power_law_1.01,2.710310363769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,power_law_1.01,2.8932159423828123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.01,52.28395385742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,2,power_law_1.2,0.6552703857421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,power_law_1.01,3.595782470703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,2,power_law_1.2,1.2498559951782227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,2,power_law_1.2,1.780735969543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.01,3.4535873413085936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,2,power_law_1.2,2.1403776168823243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,balanced,13.66586176554362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,2,power_law_1.2,3.265331268310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.01,3.545894241333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,balanced,12.786229451497396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,2,power_law_1.2,3.4509502410888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.01,3.8840511322021483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,2,power_law_1.2,3.531417465209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.01,5.017228698730468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.01,4.897792053222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,2,power_law_1.2,3.816377639770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.01,6.417561340332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,2,power_law_1.2,3.911648178100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.01,8.251500701904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,balanced,39.63677215576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,2,power_law_1.2,3.989120101928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.01,11.491725158691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,balanced,18.79794692993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,2,power_law_1.2,4.23633918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.01,16.257420349121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,2,power_law_1.2,4.3584129333496096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,2,power_law_1.2,4.336352157592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,power_law_1.01,18.970912170410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,2,power_law_1.2,4.65681266784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,2,power_law_1.2,5.103897476196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,power_law_1.01,29.38672790527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,2,power_law_1.2,6.497811126708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,2,power_law_1.2,7.172601318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,power_law_1.01,60.9141845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,2,power_law_1.2,8.029151916503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,2,power_law_1.2,10.129740905761718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,balanced,28.55714162190755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,2,power_law_1.2,8.655654144287109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,2,power_law_1.2,0.15701760053634645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,2,power_law_1.2,10.540338897705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,2,power_law_1.2,0.269324803352356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,balanced,24.2444585164388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,2,power_law_1.2,10.68373794555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,2,power_law_1.2,0.2675391912460327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,2,power_law_1.2,0.33327360153198243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,2,power_law_1.2,14.451219177246093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,2,power_law_1.2,0.6570047855377197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,2,power_law_1.2,20.129362487792967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,2,power_law_1.2,0.9787455558776855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,2,power_law_1.2,1.147110366821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,2,power_law_1.2,1.6534143447875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,2,power_law_1.2,23.20335998535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,2,power_law_1.2,1.7863296508789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,2,power_law_1.2,1.7977088928222655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,2,power_law_1.2,30.66449890136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,2,power_law_1.2,1.9032127380371093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,2,power_law_1.2,1.985318374633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,2,power_law_1.2,2.121977615356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,2,power_law_1.2,2.3672256469726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,2,power_law_1.2,50.630859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,2,power_law_1.2,2.5020864486694334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,2,power_law_1.2,2.7354944229125975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,2,power_law_1.2,2.5601024627685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,2,power_law_1.2,3.039174461364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,2,power_law_1.2,2.9679168701171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,2,power_law_1.2,3.513292694091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,balanced,59.0404052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,2,power_law_1.2,3.7396480560302736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,2,power_law_1.2,4.432140731811524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,2,power_law_1.2,4.538361740112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,2,power_law_1.2,5.579558563232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,2,power_law_1.2,5.973075103759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,2,power_law_1.2,7.330796813964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,2,power_law_1.2,9.128787231445312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,2,power_law_1.2,10.868524932861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,2,power_law_1.2,0.20313599109649658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,2,power_law_1.2,14.612530517578126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,2,power_law_1.2,0.31300480365753175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,2,power_law_1.2,0.2967103958129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,balanced,0.1784800092379252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,2,power_law_1.2,28.3447998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,2,power_law_1.2,0.3750272035598755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,balanced,0.26709334055582684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,2,power_law_1.2,0.6540800094604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,balanced,0.4909653266270955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,2,power_law_1.2,0.8957440376281738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,balanced,0.9580639998118082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,2,power_law_1.2,1.1791872024536132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,balanced,1.8625706036885579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,2,power_law_1.2,1.6485055923461913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,balanced,3.6781387329101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,2,power_law_1.2,1.7324031829833983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,balanced,5.540063858032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,2,power_law_1.2,1.8572351455688476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,balanced,5.536223729451497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,2,power_law_1.2,1.9485248565673827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,balanced,5.519162495930989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,2,power_law_1.2,2.028454399108887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,balanced,5.535231908162435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,2,power_law_1.2,2.164531135559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,2,power_law_1.2,2.390278434753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,balanced,5.5574080149332685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,balanced,0.11294933160146077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,2,power_law_1.2,2.520992088317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,balanced,5.620794932047526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,balanced,0.1623146633307139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,2,power_law_1.2,2.6575103759765626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,balanced,0.2807733416557312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,balanced,5.611701329549153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,2,power_law_1.2,3.0430976867675783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,balanced,0.5203786691029867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,balanced,5.556970596313477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,balanced,1.00492262840271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,2,power_law_1.2,3.5577598571777345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,balanced,1.9688852628072102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,balanced,5.57974370320638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,balanced,2.9174985885620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,balanced,5.598938624064128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,balanced,2.904394785563151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.2,3.559571075439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,balanced,2.916207949320475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,balanced,5.655551910400391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,balanced,2.9489545822143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.2,3.6703678131103517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,balanced,2.9586613972981772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,balanced,5.746298472086589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,balanced,2.96122137705485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.2,4.184774398803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,balanced,6.0316956837972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,balanced,2.98201592763265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,balanced,3.0477011998494468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.2,5.2377983093261715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,balanced,6.2670135498046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,balanced,3.0644585291544595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.2,5.277753448486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,balanced,3.097615877787272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,balanced,0.18661866585413614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,balanced,6.463626861572266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,balanced,3.1246506373087564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.2,7.147513580322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.17597440481185914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,balanced,0.22531733910242716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,balanced,3.213472048441569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,balanced,0.3508426745732625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.2654400110244751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.2,8.544166564941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,balanced,3.244112014770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,balanced,6.839178721110026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,balanced,0.541381319363912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.49047040939331055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,balanced,0.9842346509297689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,balanced,3.3616161346435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.2,12.006432342529298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,balanced,1.873674710591634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.6097472190856934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,balanced,2.7652692794799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,balanced,7.13162104288737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,balanced,3.4687681198120117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.01,1.3354751586914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.2,15.809292602539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,balanced,2.776442527770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.01,2.096518325805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,balanced,2.784677187601725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,balanced,3.7546987533569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.01,2.5880191802978514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,balanced,2.8046719233194985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,2,power_law_1.2,22.650553894042968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,balanced,7.815802892049153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,balanced,2.821296056111654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.01,3.342252731323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,balanced,4.116522789001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,balanced,2.84989865620931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.01,3.544307327270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,balanced,2.870565414428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,2,power_law_1.2,34.150360107421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.01,3.6603134155273436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,balanced,2.9247306187947593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,balanced,4.7076107660929365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.11179519891738891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,balanced,8.471978505452475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.01,3.841971206665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,balanced,2.9813706080118814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.1587007999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,balanced,3.0235465367635093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.01,4.0282752990722654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.01,0.2726592063903809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,balanced,3.1111733118693032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.01,4.167724609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.01,0.32832000255584715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,balanced,5.301136016845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,2,power_law_1.2,65.0442626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,balanced,3.294677416483561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.01,0.7020031929016113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.01,4.287065505981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.01,1.0935423851013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.01,4.3768257141113285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.01,1.2721983909606933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,balanced,9.62767473856608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.01,1.7222015380859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.01,4.387295913696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.01,1.8154495239257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,balanced,3.459461212158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.01,4.665273666381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.01,1.9141376495361329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,balanced,6.643423716227214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.01,5.1673023223876955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.01,2.009119987487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.01,2.0701887130737306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.01,6.265331268310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.01,2.1860416412353514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.01,7.525971221923828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.01,2.3143871307373045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.01,2.2848831176757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,balanced,11.869253794352213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.01,7.215449523925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.01,2.4254655838012695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,power_law_1.01,0.1859328031539917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,balanced,3.8644320170084634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.01,2.5004032135009764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.01,8.969190216064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,power_law_1.01,0.24380159378051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,balanced,8.137114842732748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.01,2.710393524169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,power_law_1.01,0.35317120552062986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,balanced,4.1836748123168945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.01,7.8308349609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,3.2414974212646483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,power_law_1.01,0.39687039852142336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,3.7714305877685548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,power_law_1.01,0.7471295833587647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.01,9.318956756591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,balanced,4.798495928446452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,3.6820350646972657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,power_law_1.01,1.0824576377868653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,4.4025215148925785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.01,9.78243179321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,power_law_1.01,1.3349696159362794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,3.8883136749267577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,power_law_1.01,1.7222911834716796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,balanced,5.591040293375651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,balanced,14.649002075195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.01,12.289536285400391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,4.673836898803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,power_law_1.01,1.8191295623779298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,5.69233283996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,power_law_1.01,1.9404544830322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,balanced,10.12722651163737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.01,15.148390197753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,power_law_1.01,2.048748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,7.411532592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,balanced,6.8676802317301435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,power_law_1.01,2.1131967544555663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.17611520290374755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.01,18.972377014160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,9.180748748779298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,power_law_1.01,2.1981760025024415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.26566400527954104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.01,11.003475189208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,power_law_1.01,2.427174377441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.36903040409088134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.01,24.445753479003905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,balanced,10.699381510416666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,power_law_1.01,2.629452705383301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.6094272136688232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.01,15.634559631347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,power_law_1.01,2.786227226257324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,1,power_law_1.2,1.1258560180664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,power_law_1.01,3.072480010986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,1,power_law_1.2,1.7824832916259765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.01,32.94668884277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,1,power_law_1.2,2.299398422241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,power_law_1.01,3.6208065032958983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.01,60.136590576171876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,1,power_law_1.2,3.139743995666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,balanced,13.528170267740885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,1,power_law_1.2,3.2555007934570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,balanced,22.821734110514324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.01,3.727443313598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,balanced,15.160149892171225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,1,power_law_1.2,3.5452991485595704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,1,power_law_1.2,3.786259078979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.01,3.750233459472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,1,power_law_1.2,3.992006301879883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.01,4.398694229125977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,1,power_law_1.2,4.120627212524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.01,5.508492660522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,1,power_law_1.2,4.242329788208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,balanced,18.533584594726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.01,6.122560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,1,power_law_1.2,4.326950454711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,1,power_law_1.2,4.483865737915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.01,8.01638412475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,1,power_law_1.2,4.897619247436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.01,10.18853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,1,power_law_1.2,5.215526580810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,1,power_law_1.2,6.574342346191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.01,14.099623107910157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,1,power_law_1.2,7.737554931640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,1,power_law_1.2,7.632422637939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.01,18.762220764160155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,balanced,24.653477986653645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,1,power_law_1.2,9.401907348632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.01,22.974822998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,1,power_law_1.2,8.503302764892577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,1,power_law_1.2,10.222758483886718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,power_law_1.01,35.66520385742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,1,power_law_1.2,10.581747436523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,1,power_law_1.2,12.863449096679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,balanced,29.738441467285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,1,power_law_1.2,17.777439880371094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,balanced,44.13478088378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,power_law_1.01,71.46939697265626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,1,power_law_1.2,20.82072296142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,balanced,38.14634704589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,1,power_law_1.2,24.774246215820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,1,power_law_1.2,54.98304443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.11222399473190307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.15864319801330568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,1,power_law_1.2,0.18755840063095092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,1,power_law_1.2,0.32990078926086425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,1,power_law_1.2,0.620140790939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,1,power_law_1.2,1.0013440132141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,1,power_law_1.2,1.131276798248291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,1,power_law_1.2,1.65350399017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,1,power_law_1.2,1.7588415145874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,1,power_law_1.2,1.8249984741210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,1,power_law_1.2,1.9654720306396485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,1,power_law_1.2,2.0573888778686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,1,power_law_1.2,2.111520004272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,1,power_law_1.2,2.2593088150024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,1,power_law_1.2,2.337753677368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,1,power_law_1.2,2.3785791397094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,balanced,75.17171732584636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,1,power_law_1.2,2.485887908935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,1,power_law_1.2,2.788902473449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,3.40618896484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,3.88076171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,3.8057151794433595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,4.599795150756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,4.149990463256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,5.032320022583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,6.049516677856445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,1,power_law_1.2,0.1949952006340027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,balanced,0.09410666426022847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,7.719270324707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,1,power_law_1.2,0.24455039501190184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,1,power_law_1.2,0.29160959720611573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,9.619200134277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,1,power_law_1.2,0.3940160036087036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,balanced,0.11556800206502278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,1,power_law_1.2,0.6545599937438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,1,power_law_1.2,11.745369720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,1,power_law_1.2,0.9473471641540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,1,power_law_1.2,1.1659456253051759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,balanced,0.13061867157618204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,1,power_law_1.2,15.919577026367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,1,power_law_1.2,1.6521984100341798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,1,power_law_1.2,1.723148727416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,1,power_law_1.2,32.17403564453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,balanced,0.1933120091756185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,1,power_law_1.2,1.827507209777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,1,power_law_1.2,1.9440832138061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,1,power_law_1.2,2.1058879852294923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,balanced,0.33432531356811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,1,power_law_1.2,2.1752063751220705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,power_law_1.01,0.10697599649429321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,balanced,0.335477352142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,1,power_law_1.2,2.3956031799316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,balanced,0.33724268277486164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,power_law_1.01,0.13608959913253785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,balanced,0.3373013337453206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,1,power_law_1.2,2.613177680969238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,power_law_1.01,0.11728639602661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,balanced,0.3385759989420573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,power_law_1.01,0.11745920181274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,1,power_law_1.2,2.765216064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,balanced,0.3404586712519328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,power_law_1.01,0.15998079776763915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,balanced,0.3425920009613037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,1,power_law_1.2,3.046143913269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,power_law_1.01,0.18008960485458375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,balanced,0.34326398372650146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,power_law_1.01,0.23968000411987306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,1,power_law_1.2,3.7416831970214846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,balanced,0.34697067737579346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,power_law_1.01,0.26143360137939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,2,power_law_1.2,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,power_law_1.01,0.2744064092636108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,2,power_law_1.2,0.1295807957649231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.2,3.758310317993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,power_law_1.01,0.28688640594482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,balanced,0.07036800185839336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,2,power_law_1.2,0.11358079910278321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,balanced,0.3766186634699504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,power_law_1.01,0.2930880069732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,2,power_law_1.2,0.11399680376052856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,balanced,0.379472017288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,power_law_1.01,0.2974720001220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,2,power_law_1.2,0.13572479486465455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,balanced,0.08965866764386494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.2,3.9448577880859377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,power_law_1.01,0.33374719619750975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,balanced,0.3810666799545288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,2,power_law_1.2,0.1661247968673706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,power_law_1.01,0.34431359767913816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.2,4.482892990112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,2,power_law_1.2,0.23694078922271727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,power_law_1.01,0.0698303997516632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,power_law_1.01,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,2,power_law_1.2,0.26842238903045657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,power_law_1.01,0.08733440041542054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.2,5.744121551513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,balanced,0.12072533369064331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,power_law_1.01,0.3859008073806763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,2,power_law_1.2,0.2619647979736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,power_law_1.01,0.09679359793663025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,balanced,0.1511733333269755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.2,6.236761474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,2,power_law_1.2,0.2845247983932495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,power_law_1.01,0.4223616123199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,balanced,0.4991413354873657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,power_law_1.01,0.13178240060806273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,balanced,0.19132800896962485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,2,power_law_1.2,0.30191359519958494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.2,8.226105499267579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,power_law_1.01,0.13598719835281373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,balanced,0.5044320027033488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,power_law_1.01,0.5626368045806884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,balanced,0.3426239887873332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,2,power_law_1.2,0.30180480480194094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,power_law_1.01,0.17804160118103027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,balanced,0.3434346516927083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,power_law_1.01,0.6356160163879394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,balanced,1.0289066632588704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.2,10.203756713867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,power_law_1.01,0.2404223918914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,2,power_law_1.2,0.3371135950088501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,balanced,0.34401599566141766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,power_law_1.01,1.190227222442627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,balanced,1.040613333384196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,power_law_1.01,0.25509119033813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,2,power_law_1.2,0.37763841152191163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,balanced,0.34594666957855225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,power_law_1.01,1.3586688041687012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.2,14.447456359863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,power_law_1.01,0.26702721118927003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,2,power_law_1.2,0.38896639347076417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,balanced,0.3468266725540161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,balanced,1.059338649113973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,power_law_1.01,1.5782400131225587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,power_law_1.01,0.2839423894882202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,balanced,0.3490346670150757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,2,power_law_1.2,0.41480321884155275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,power_law_1.01,1.897939109802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.2,18.42909393310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,power_law_1.01,0.28679039478302004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,balanced,1.0867466926574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,balanced,0.3509013255437215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,2,power_law_1.2,0.45233922004699706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,power_law_1.01,2.427027130126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,balanced,0.353279987970988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,2,power_law_1.2,0.6321856021881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,power_law_1.01,3.147385597229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,balanced,2.059002717336019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.2,22.881062316894532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,power_law_1.01,0.3145792007446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,balanced,0.3563786745071411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,2,power_law_1.2,0.6899199962615967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,power_law_1.01,4.284588623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,power_law_1.01,0.35288960933685304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,balanced,0.360586682955424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,2,power_law_1.2,1.3278464317321776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,power_law_1.01,5.343161773681641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,power_law_1.01,0.3923840045928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,balanced,2.1279199918111167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,balanced,0.36401065190633136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,2,power_law_1.2,1.4529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,power_law_1.01,0.42539520263671876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,1,power_law_1.2,36.200314331054685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,power_law_1.01,6.433452606201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,balanced,0.37055468559265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,2,power_law_1.2,1.793894386291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,power_law_1.01,0.4836287975311279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,balanced,0.40462934970855713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,power_law_1.01,0.5136064052581787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,power_law_1.01,9.94049301147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,2,power_law_1.2,1.9716991424560546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,balanced,3.131744066874186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,1,power_law_1.2,0.07035520076751708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,power_law_1.01,0.6004543781280518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,balanced,0.41198400656382245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,2,power_law_1.2,2.665260887145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,power_law_1.01,0.7365119934082032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,1,power_law_1.2,0.08721280097961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,power_law_1.01,17.994195556640626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,balanced,0.5411839882532755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,2,power_law_1.2,3.3245887756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,1,power_law_1.2,0.09770879745483399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,power_law_1.01,0.8736319541931152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,1,power_law_1.2,70.87893676757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,balanced,0.5553280115127563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,1,power_law_1.2,0.12659840583801268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,2,power_law_1.2,4.391936111450195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,power_law_1.01,1.6282432556152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,balanced,4.173002560933431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,1,power_law_1.2,0.12626559734344484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,power_law_1.01,1.8955007553100587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,2,power_law_1.2,5.605081558227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,balanced,1.1433227062225342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,power_law_1.01,2.431430435180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,1,power_law_1.2,0.1705407977104187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,power_law_1.2,6.460601806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,power_law_1.01,2.994688034057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,1,power_law_1.2,0.23260159492492677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,balanced,1.1727306842803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,1,power_law_1.2,0.2557248115539551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,power_law_1.01,4.085843276977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,power_law_1.2,11.229753875732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,1,power_law_1.2,0.266975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,balanced,2.2229812939961753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,power_law_1.01,5.124473571777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,2,balanced,5.162517229715983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,1,power_law_1.2,0.28146560192108155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,power_law_1.01,6.22105598449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,power_law_1.2,21.486361694335937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,1,power_law_1.2,0.29338879585266114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,balanced,2.281888008117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,power_law_1.01,9.496435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,1,power_law_1.2,0.30240640640258787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,1,power_law_1.2,0.33381760120391846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,power_law_1.01,18.23945007324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,1,power_law_1.2,0.3686464071273804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,balanced,3.3707412083943686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,1,power_law_1.2,0.41283202171325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,1,power_law_1.2,0.4483520030975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,2,balanced,8.275189081827799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,1,power_law_1.2,0.5050559997558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,1,power_law_1.2,0.5452223777770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,balanced,4.508847872416179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,1,power_law_1.2,0.6415359973907471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,1,power_law_1.2,0.8039999961853027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,1,power_law_1.2,0.9082816123962403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,1,power_law_1.2,1.7536703109741212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,1,power_law_1.2,2.0153087615966796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,balanced,5.618069330851237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,1,power_law_1.2,2.5561920166015626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,1,power_law_1.2,3.0726911544799806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,1,power_law_1.2,4.154540634155273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,balanced,0.072543998559316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,1,power_law_1.2,5.217939376831055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,2,balanced,16.40112559000651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,balanced,0.09429333607355754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,1,power_law_1.2,6.315398406982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,balanced,8.821119944254557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,1,power_law_1.2,9.596211242675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,balanced,0.11277332901954651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,power_law_1.2,18.524365234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,balanced,0.12896000345547995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,balanced,0.11742400129636128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,balanced,0.12458133697509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,balanced,0.12481600046157837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,balanced,0.12648533781369528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,1,balanced,17.56490707397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,balanced,0.12187199791272481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,balanced,0.12270933389663696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,balanced,0.12324266632397969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,balanced,0.15941333770751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,balanced,0.15945600469907126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,balanced,0.1604213317235311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,balanced,0.28543466329574585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,balanced,0.28757866223653156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,balanced,0.28859732548395794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,balanced,0.2926986614863078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,balanced,0.2974453369776408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,balanced,0.546122670173645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,balanced,0.5575733184814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,power_law_1.01,0.09857919812202454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,2,power_law_1.2,0.09026560187339783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,balanced,0.8107786973317465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,power_law_1.2,0.10527360439300537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,2,power_law_1.01,0.10266239643096924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,power_law_1.01,0.11151360273361206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,2,power_law_1.2,0.11066880226135253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,balanced,1.0665120283762615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,power_law_1.2,0.09512320160865784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,2,power_law_1.01,0.10087679624557495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,power_law_1.2,0.11546239852905274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,2,power_law_1.01,0.11201920509338378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,power_law_1.2,0.12350720167160034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,balanced,1.5840853055318196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,2,power_law_1.01,0.12382719516754151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,balanced,0.06919999917348225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,power_law_1.2,0.1258944034576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,2,power_law_1.01,0.12949759960174562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,power_law_1.2,0.13203200101852416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,2,power_law_1.01,0.1269376039505005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,balanced,2.1093600591023765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,power_law_1.2,0.14309760332107543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,balanced,0.08935999870300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,2,power_law_1.01,0.13309439420700073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,power_law_1.01,0.1392575979232788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,2,power_law_1.2,0.143340802192688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,power_law_1.01,0.06845440268516541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,power_law_1.01,0.14368640184402465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,2,power_law_1.2,0.1541759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,balanced,3.1215041478474936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,power_law_1.2,0.18305280208587646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,2,power_law_1.01,0.18619519472122192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,balanced,0.11847999691963196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,power_law_1.01,0.08125439882278443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,power_law_1.2,0.1803007960319519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,2,power_law_1.01,0.1895359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,balanced,0.14738667011260986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,power_law_1.01,0.09886080026626587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,power_law_1.2,0.1961408019065857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,power_law_1.01,0.0986303985118866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,2,power_law_1.01,0.19486080408096312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,balanced,0.11760532855987549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,power_law_1.2,0.35642879009246825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,power_law_1.01,0.11729919910430908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,balanced,0.1195093293984731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,2,power_law_1.01,0.3609600067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,balanced,4.14522139231364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,power_law_1.01,0.117740797996521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,power_law_1.2,0.3769216060638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,balanced,0.12025599678357442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,2,power_law_1.01,0.36696319580078124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,power_law_1.01,0.11816960573196411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,power_law_1.2,0.39806718826293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,balanced,0.12101333340009053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,power_law_1.01,0.11915520429611207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,2,power_law_1.01,0.3796351909637451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,power_law_1.2,0.48282880783081056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,power_law_1.01,0.13082239627838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,balanced,0.12138133247693379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,2,power_law_1.01,0.46701440811157224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,power_law_1.01,0.13661439418792726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,power_law_1.2,0.5666431903839111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,balanced,0.12237333257993062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,2,power_law_1.01,0.5371647834777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,power_law_1.01,0.15306240320205688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,balanced,0.12372266252835591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,power_law_1.2,0.6867199897766113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,balanced,5.165216128031413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,power_law_1.01,0.14927999973297118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,2,power_law_1.01,0.6756671905517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,balanced,0.122597336769104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,power_law_1.2,0.9246848106384278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,power_law_1.01,0.1587391972541809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,2,power_law_1.01,0.8106304168701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,balanced,0.12268799543380737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,power_law_1.01,0.17978880405426026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,power_law_1.2,1.181503963470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,balanced,0.12458667159080505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,power_law_1.01,0.2014400005340576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,2,power_law_1.01,1.2248576164245606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,power_law_1.2,1.5573504447937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,power_law_1.01,0.2270591974258423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,balanced,0.15221333503723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,power_law_1.01,0.241593599319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,2,power_law_1.01,1.4904383659362792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,balanced,0.16549866398175558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,power_law_1.2,2.2066368103027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,balanced,0.15410133202870688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,power_law_1.01,0.4419519901275635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,1,power_law_1.2,0.06823040246963501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,2,power_law_1.01,2.0502784729003904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,balanced,0.14334400494893393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,balanced,0.15711466471354166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,power_law_1.2,2.9211967468261717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,power_law_1.01,0.5095551967620849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,balanced,0.25970133145650226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,1,power_law_1.2,0.0813696026802063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,2,power_law_1.01,2.724345588684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,balanced,0.3102506597836812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,power_law_1.01,0.6395711898803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,power_law_1.2,3.8865215301513674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,balanced,0.26190932591756183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,balanced,8.189525604248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,1,power_law_1.2,0.09097599983215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,power_law_1.01,0.7712063789367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,balanced,0.2566506663958232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,balanced,0.3149706721305847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,2,power_law_1.01,4.663199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,power_law_1.2,6.629869079589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,balanced,0.2608799934387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,1,power_law_1.2,0.09763200283050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,power_law_1.01,1.0416255950927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,balanced,0.09673600395520528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,balanced,0.588154673576355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,balanced,0.263045330842336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,2,power_law_1.01,5.056467056274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,1,power_law_1.2,0.11541119813919068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,power_law_1.01,1.3302592277526855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,power_law_1.2,8.059910583496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,balanced,0.2590293288230896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,balanced,0.09516266981760661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,balanced,0.6008053223292033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,1,power_law_1.2,0.11747839450836181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,balanced,0.26748265822728473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,2,power_law_1.01,6.005977630615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,balanced,0.152837336063385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,power_law_1.01,1.8545663833618165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,balanced,0.26925865809122723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,1,power_law_1.2,0.12168960571289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,balanced,0.1565600037574768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,power_law_1.2,12.582681274414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,balanced,0.8871253331502279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,power_law_1.01,2.4026815414428713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,1,power_law_1.2,0.11891839504241944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,balanced,0.2717760006586711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,2,power_law_1.01,10.123788452148437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,balanced,0.15614400307337442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,balanced,0.15516266226768494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,1,power_law_1.2,0.12881920337677003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,balanced,0.2797386646270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,power_law_1.01,3.5094913482666015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,balanced,1.1681973139444988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,power_law_1.2,20.801356506347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,balanced,0.15587199727694193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,1,power_law_1.2,0.1388864040374756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,balanced,0.2812533378601074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,power_law_1.01,20.933074951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,power_law_1.01,4.6050048828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,balanced,0.15730667114257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,1,power_law_1.2,0.1533184051513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,balanced,0.2869759996732076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,balanced,0.15793599685033163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,balanced,1.7003413836161296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,balanced,0.3020106752713521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,1,power_law_1.2,0.14910080432891845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,power_law_1.01,5.7101184844970705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,balanced,0.1586186687151591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,balanced,0.3073280056317647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,1,power_law_1.2,0.16359039545059204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,balanced,0.16127467155456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,balanced,0.3039039969444275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,power_law_1.01,8.92003173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,1,power_law_1.2,0.1805567979812622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,balanced,2.275210698445638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,balanced,0.1620373328526815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,balanced,0.3683520158131917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,1,power_law_1.2,0.2021951913833618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,balanced,0.164410670598348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,balanced,0.38207467397054035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,2,balanced,16.36895497639974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,power_law_1.01,17.47783660888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,balanced,0.1662879983584086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,1,power_law_1.2,0.22942719459533692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,balanced,0.5520426829655966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,balanced,0.18488534291585287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,1,power_law_1.2,0.24846079349517822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,balanced,3.377706527709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,balanced,0.581061323483785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,balanced,0.18698134024937949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,1,power_law_1.2,0.46064000129699706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,balanced,0.18652800718943277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,balanced,0.81113068262736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,balanced,0.2226240038871765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,1,power_law_1.2,0.5096640110015869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,balanced,1.0021066665649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,balanced,0.24645866950352988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,1,power_law_1.2,0.6524288177490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,balanced,0.29574400186538696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,balanced,4.441216150919597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,1,power_law_1.2,0.7821375846862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,balanced,1.4474080403645833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,balanced,0.34620265165964764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,1,power_law_1.2,1.0393088340759278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,balanced,1.867813269297282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,balanced,0.49961066246032715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,1,power_law_1.2,1.3067456245422364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,1,power_law_1.2,1.869887924194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,balanced,0.5937973260879517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,balanced,2.7852160135904946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,1,power_law_1.2,2.403455924987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,balanced,5.5770721435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,balanced,0.8644906679789225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,1,power_law_1.2,3.4938430786132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,balanced,3.816351890563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,balanced,1.3225653171539307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,1,power_law_1.2,4.59552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,1,power_law_1.2,5.661439895629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,balanced,1.9358399709065754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,balanced,4.791237195332845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,power_law_1.2,8.90447998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,balanced,2.4953866004943848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,1,balanced,8.848288218180338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,power_law_1.2,17.75226287841797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,balanced,3.102698644002279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,balanced,8.394240061442057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,balanced,5.001301447550456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,balanced,16.776463826497395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,1,balanced,17.528143564860027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,balanced,9.525274912516275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.2532480001449585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.1407807946205139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.232806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.13151999711990356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.20690560340881348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.14104959964752198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.01,0.25397119522094724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.15415680408477783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.01,0.25394558906555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.15493119955062867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.01,0.2631040096282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.15927040576934814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.01,0.2837951898574829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.01,0.2737279891967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.1537343978881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.01,0.2893759965896606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.161900794506073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,balanced,0.08846400181452434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.01,0.37319040298461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.17369600534439086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.01,0.3473536014556885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,balanced,0.08866666754086812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,power_law_1.01,0.13082239627838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.01,0.4304192066192627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.17770880460739136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,balanced,0.14314132928848267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,power_law_1.01,0.12049920558929443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.01,0.46300158500671384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.173363196849823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,balanced,0.14665599664052328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.01,0.38652160167694094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,power_law_1.01,0.12013440132141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.19686399698257445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,balanced,0.14731733004252115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.01,0.4530176162719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,power_law_1.01,0.14632960557937622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,balanced,0.14900267124176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.19319679737091064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.01,0.48503680229187013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,power_law_1.01,0.1480064034461975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.01,0.45279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,balanced,0.15158399939537048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.24204800128936768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.01,0.6032576084136962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,power_law_1.01,0.15790079832077025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,balanced,0.1509813368320465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.2652928113937378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.01,0.6541247844696045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,power_law_1.01,0.17383040189743043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.3361407995223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.01,1.0022080421447754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,power_law_1.01,0.19440000057220458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.01,1.4440768241882325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.01,0.29053440093994143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,balanced,0.16024532914161682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.01,1.8556480407714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.01,0.3456959962844849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.01,2.0274431228637697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,balanced,0.16108266512552896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,power_law_1.01,0.17834240198135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,0.43566079139709474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.01,4.424812698364258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,power_law_1.01,0.19911680221557618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,0.5784063816070557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.01,6.135212707519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,0.7648191928863526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,4,power_law_1.2,0.2584831953048706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.01,9.486707305908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,0.9901887893676757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,4,power_law_1.2,0.21233279705047609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,1.515334415435791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,4,power_law_1.2,0.2327359914779663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.01,11.292813110351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,balanced,0.1583573321501414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,power_law_1.01,0.183404803276062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,4,power_law_1.2,0.2581376075744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,1.8473983764648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,4,power_law_1.2,0.2555455923080444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,balanced,0.16034666697184244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,power_law_1.01,0.20878078937530517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.01,13.015673828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,4,power_law_1.2,0.266374397277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,2.4833791732788084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,balanced,0.16408532857894897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,power_law_1.01,0.2073280096054077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,4,power_law_1.2,0.3144767999649048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,balanced,0.16639467080434164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,4.98803825378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,power_law_1.01,0.25742719173431394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,4,power_law_1.2,0.2719871997833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.01,21.815008544921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.129203200340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,4,power_law_1.2,0.32997119426727295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,5.645804977416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,4,power_law_1.2,0.34917120933532714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.11941759586334229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.01,7.439788818359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,4,power_law_1.2,0.36849279403686525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,4,power_law_1.2,0.4627647876739502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.15217920541763305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.01,36.721624755859374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,4,power_law_1.2,0.4606143951416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.01,12.35572509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.1541759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,4,power_law_1.2,0.40387840270996095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,balanced,0.1783626675605774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,power_law_1.01,0.2739775896072388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,4,power_law_1.2,0.40838398933410647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.15504640340805054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,balanced,0.18471999963124594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,power_law_1.01,0.26360321044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.01,24.244320678710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,4,power_law_1.2,0.454636812210083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,balanced,0.19150400161743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.1583295941352844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,power_law_1.01,0.3708672046661377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,balanced,0.09707199533780415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,4,power_law_1.2,0.5405824184417725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,balanced,0.2469066580136617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,power_law_1.01,0.5876351833343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.16480640172958375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,4,power_law_1.2,0.5946752071380615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,balanced,0.1462613344192505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,balanced,0.26314133405685425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.01,0.6223680019378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.1631999969482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,4,power_law_1.2,0.914361572265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,balanced,0.25123733282089233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,4,power_law_1.2,0.13109760284423827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.1675711989402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,4,power_law_1.2,1.0317055702209472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,balanced,0.25549866755803424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,4,power_law_1.2,0.12043520212173461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.17945599555969238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,4,power_law_1.2,1.4966848373413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,balanced,0.25572266181310016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,4,power_law_1.2,0.12065919637680053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.172326397895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,4,power_law_1.2,2.3045440673828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,balanced,0.2571360071500142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,4,power_law_1.2,0.14599679708480834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.2034303903579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,balanced,0.25777600208918255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,4,power_law_1.2,3.2021888732910155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,4,power_law_1.2,0.14854400157928466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.19550080299377443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,balanced,0.25890133778254193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,4,power_law_1.2,4.832761764526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.01,0.8776191711425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,balanced,0.40220801035563153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.2403968095779419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,balanced,0.26580266157786053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,4,power_law_1.2,0.16620800495147706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.01,1.3455424308776855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.2809983968734741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,4,power_law_1.2,5.6398273468017575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,balanced,0.2669653296470642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,balanced,0.5101226568222046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,4,power_law_1.2,0.18202240467071534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.35211520195007323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,balanced,0.2718186577161153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.01,1.8956287384033204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,balanced,0.7627092997233073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,4,power_law_1.2,0.29294719696044924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,4,power_law_1.2,8.666226959228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,4,power_law_1.2,0.18611840009689332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,balanced,0.2790880004564921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.01,2.7076671600341795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,4,power_law_1.2,0.3680000066757202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,balanced,0.28146666288375854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.01,3.869247817993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,4,power_law_1.2,11.266508483886719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,0.4299327850341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,balanced,1.0146293640136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,balanced,0.2892213265101115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,4,power_law_1.2,0.19452799558639527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,0.5502079963684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,balanced,0.2924853364626567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.01,5.241523361206054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,0.9821696281433105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,4,power_law_1.2,0.21056001186370848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,balanced,1.5308160781860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,4,power_law_1.2,13.121395874023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,balanced,0.29875733455022174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,1.2767359733581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.01,8.030662536621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,balanced,0.30824534098307294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,1.7841920852661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,balanced,2.0325279235839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,balanced,0.3550666570663452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,2.47576961517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,4,power_law_1.2,27.2144775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,4,power_law_1.2,0.18659199476242067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.01,11.259776306152343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,balanced,0.42421332995096844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,3.2613887786865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,4,power_law_1.2,0.20166399478912353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,balanced,3.0404052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,balanced,0.5951093435287476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,5.279788970947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,power_law_1.01,14.783865356445313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,4,power_law_1.2,0.217740797996521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,7.607654571533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,balanced,0.5251520077387491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,4,power_law_1.2,44.519073486328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,4,power_law_1.2,0.24608640670776366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,balanced,4.041621208190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,power_law_1.01,23.081663513183592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,4,power_law_1.2,7.5403587341308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,balanced,0.7630666891733805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,balanced,0.956933339436849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,4,power_law_1.2,13.95160369873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,4,power_law_1.2,0.24396159648895263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,balanced,5.062378565470378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,balanced,1.4159305890401204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,4,power_law_1.2,0.31568639278411864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,power_law_1.01,48.364767456054686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,4,power_law_1.2,0.4382080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,4,power_law_1.2,29.39246826171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,balanced,1.86628262201945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,4,power_law_1.2,0.6055359840393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.2,0.6091775894165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,balanced,8.267754872639975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,balanced,2.754624048868815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.2,0.9788479804992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,balanced,3.9576638539632163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.2,1.5160256385803224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.2,1.6655040740966798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.2,3.016409683227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,balanced,4.9394880930582685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.2,4.226937484741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,balanced,17.939776102701824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.2,5.521926498413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.2,8.880274963378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,balanced,8.10047976175944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.2,12.337305450439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,4,power_law_1.2,12.884658813476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,4,power_law_1.2,33.808038330078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,balanced,15.515850067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,4,power_law_1.2,56.24954833984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,balanced,0.06605333089828491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,balanced,0.09033600489298503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,balanced,0.14564800262451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,balanced,0.14984533190727234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,balanced,0.15067199865976968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,balanced,0.1513653298219045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,balanced,0.15317866206169128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,balanced,0.05570666491985321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,balanced,0.153957337141037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,balanced,0.08380800485610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,balanced,0.1546880006790161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,balanced,0.15653866529464722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,balanced,0.14036800463994345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,balanced,0.14446933070818582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,balanced,0.15853333473205566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,balanced,0.14460266629854837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,balanced,0.15991999705632529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,balanced,0.1467626690864563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,balanced,0.16173332929611206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,balanced,0.15090133746465048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,balanced,0.17056000232696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,balanced,0.15028267105420431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,balanced,0.1805973251660665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,balanced,0.18304532766342163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,balanced,0.19100799163182577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,balanced,0.2214133342107137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,balanced,0.2346293330192566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,balanced,0.15330132842063904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,balanced,0.30963732798894245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,balanced,0.1547040045261383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,balanced,0.3424266576766968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.01,0.08380159735679626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.01,0.12836480140686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,balanced,0.4912480115890503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.01,0.1010815978050232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.01,0.17455359697341918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,balanced,0.613754669825236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.01,0.10574719905853272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.01,0.1757696032524109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.01,0.2554624080657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.01,0.149017596244812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,balanced,0.8936853408813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.01,0.23411200046539307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.01,0.14917759895324706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,balanced,0.15916267037391663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.01,0.26036479473114016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.01,0.15459840297698973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,balanced,0.16181866327921549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,balanced,1.1696746349334717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,power_law_1.01,0.06591359972953796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.01,0.3000319957733154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,balanced,0.1660533348719279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.01,0.1594879984855652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,power_law_1.01,0.08877440094947815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,balanced,0.16981865962346396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.01,0.3019776105880737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.01,0.160697603225708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,balanced,1.7174453735351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,power_law_1.01,0.08906239867210389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.01,0.3154239892959595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.01,0.1638975977897644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,2,power_law_1.2,0.12899839878082275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,power_law_1.01,0.1428607940673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.01,0.3234944105148315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.01,0.16657279729843139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,2,power_law_1.2,0.1628864049911499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,power_law_1.01,0.14413440227508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,balanced,2.334719975789388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.01,0.3279871940612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.01,0.16837120056152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,balanced,0.1831573247909546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,2,power_law_1.2,0.17589759826660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,power_law_1.01,0.15731199979782104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.01,0.33303680419921877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.01,0.17884160280227662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,2,power_law_1.2,0.2547264099121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,balanced,0.1878933310508728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,power_law_1.01,0.1695296049118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.01,0.36335999965667726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,2,power_law_1.2,0.24447999000549317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,balanced,0.19899199406305948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.01,0.18069759607315064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,power_law_1.01,0.1757375955581665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,2,power_law_1.2,0.26065280437469485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,balanced,3.072922706604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.01,0.3498111963272095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,balanced,0.2656159996986389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,2,power_law_1.2,0.2930624008178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.01,0.1944383978843689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.01,0.37217280864715574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,balanced,0.28495466709136963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,2,power_law_1.2,0.3031487941741943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.01,0.20977919101715087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.01,0.38074240684509275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,2,power_law_1.2,0.32196478843688964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,power_law_1.01,0.17284480333328248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.01,0.20444800853729247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,2,power_law_1.2,0.33955199718475343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.01,0.3879551887512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,power_law_1.01,0.17807999849319459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,2,power_law_1.2,0.31296000480651853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.01,0.22351999282836915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.01,0.49658880233764646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,balanced,4.646959940592448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,2,power_law_1.2,0.34715518951416013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.01,0.27409279346466064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,balanced,0.42395734786987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,2,power_law_1.2,0.351148796081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.01,0.6462912082672119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.01,0.35394558906555174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,2,power_law_1.2,0.33987839221954347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,power_law_1.01,0.17643519639968872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,balanced,0.5511200030644735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.01,0.9567744255065918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,2,power_law_1.2,0.38541440963745116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.01,0.45444478988647463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,power_law_1.01,0.1776255965232849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.01,0.7820543766021728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,balanced,0.8469066619873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,2,power_law_1.2,0.37957119941711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.01,0.4948736190795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,power_law_1.01,0.18556159734725952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.01,1.2627519607543944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,2,power_law_1.2,0.3680448055267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,balanced,1.1333706378936768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.01,0.8175040245056152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,2,power_law_1.2,0.472979211807251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,power_law_1.01,0.2049407958984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.01,1.5882431983947753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,2,power_law_1.2,0.6367231845855713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,2,power_law_1.2,0.08428159952163697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.01,0.9681407928466796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,balanced,1.68558931350708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.01,2.714726448059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,2,power_law_1.2,0.913913631439209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,power_law_1.01,0.21982719898223876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.01,1.4271039962768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,2,power_law_1.2,0.9003264427185058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,2,power_law_1.2,0.10037120580673217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,balanced,9.03170649210612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.01,3.3611072540283202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,power_law_1.01,0.23390719890594483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,2,power_law_1.2,1.320633602142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.01,1.8608192443847655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,balanced,2.23690128326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,2,power_law_1.2,0.09510400295257568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,2,power_law_1.2,1.5575103759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,power_law_1.01,0.2654848098754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.01,4.952780914306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.01,2.923494338989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,2,power_law_1.2,0.14280320405960084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,2,power_law_1.2,2.4670976638793944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,power_law_1.01,0.3637439966201782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.01,6.086214447021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,2,power_law_1.2,3.166169548034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,2,power_law_1.2,0.14959360361099244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,balanced,3.351594607035319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,power_law_1.01,0.46254720687866213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.01,3.8881343841552733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,2,power_law_1.2,4.3359935760498045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,2,power_law_1.2,0.15384960174560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.01,7.7427520751953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.01,5.007916641235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,power_law_1.01,0.6529600143432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,2,power_law_1.2,0.15965440273284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,2,power_law_1.2,6.302643203735352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,balanced,4.472074508666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,power_law_1.01,0.9513216018676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.01,13.944563293457032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,2,power_law_1.2,0.1586303949356079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.01,7.164608001708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,2,power_law_1.2,8.826573181152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,power_law_1.01,1.1886079788208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,2,power_law_1.2,0.1629439949989319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,2,power_law_1.2,0.1642303943634033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,power_law_1.01,1.5849663734436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,2,power_law_1.2,12.867462158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.01,14.139558410644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.01,27.206304931640624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,balanced,5.5350290934244795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,2,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,2,power_law_1.2,0.16943360567092897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,power_law_1.01,2.5263423919677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,2,power_law_1.2,0.09441279768943786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,2,power_law_1.2,0.176256000995636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,2,power_law_1.2,0.08323839902877808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,2,power_law_1.2,25.683047485351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,power_law_1.01,3.4278209686279295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,2,power_law_1.2,0.17645440101623536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,2,power_law_1.2,0.13699840307235717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,power_law_1.01,4.605510330200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,2,power_law_1.2,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,2,power_law_1.2,0.1437440037727356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,2,power_law_1.2,0.20805120468139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,balanced,8.894805272420248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,power_law_1.01,6.979923248291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,2,power_law_1.2,0.1579200029373169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,2,power_law_1.2,0.2154752016067505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,2,power_law_1.2,0.16320639848709106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,power_law_1.01,8.278572845458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,2,power_law_1.2,0.23733119964599608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,2,power_law_1.2,0.1742591977119446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,2,power_law_1.2,0.2882303953170776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,power_law_1.01,14.862693786621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,2,power_law_1.2,0.3724544048309326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,2,power_law_1.2,0.1721984028816223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,2,power_law_1.2,0.4165184020996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,2,power_law_1.2,0.1743615984916687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,2,power_law_1.2,0.532748794555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,power_law_1.01,33.48910827636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,2,power_law_1.2,0.8307711601257324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,2,power_law_1.2,0.17581440210342408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,balanced,18.01962153116862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,2,power_law_1.2,1.0558591842651368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,2,power_law_1.2,0.18557440042495726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,2,power_law_1.2,0.18925440311431885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,2,power_law_1.2,1.417676830291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,2,power_law_1.2,0.21237120628356934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,2,power_law_1.2,2.071743965148926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,2,power_law_1.2,0.21150720119476318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,2,power_law_1.2,0.2322943925857544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,2,power_law_1.2,2.9702016830444338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,2,power_law_1.2,0.2873408079147339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,2,power_law_1.2,0.3699903964996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,2,power_law_1.2,3.8627902984619142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,2,power_law_1.2,0.4750976085662842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,2,power_law_1.2,5.370707321166992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,2,power_law_1.2,0.6764800071716308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,2,power_law_1.2,0.9287615776062011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,2,power_law_1.2,8.10483169555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,2,power_law_1.2,1.3915264129638671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,2,power_law_1.2,1.8213184356689454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,2,power_law_1.2,15.14755859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,2,power_law_1.2,2.475948715209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,2,power_law_1.2,3.793849563598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,2,power_law_1.2,6.161388778686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,2,power_law_1.2,7.76355209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,2,power_law_1.2,9.22767333984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,2,power_law_1.2,15.674368286132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,2,power_law_1.2,30.17145690917969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,balanced,0.09429333607355754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,balanced,0.13788800438245138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,balanced,0.25121599435806274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,balanced,0.25593600670496625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,balanced,0.2561279932657878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,balanced,0.25783467292785645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,balanced,0.25966399908065796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,balanced,0.26210665702819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,balanced,0.060191998879114784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,balanced,0.26612265904744464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,balanced,0.26678399244944256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,balanced,0.08767466743787129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,balanced,0.272602657477061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,balanced,0.14501866698265076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,balanced,0.27674667040507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,balanced,0.27666666110356647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,balanced,0.14889599879582724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,balanced,0.2924906611442566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,balanced,0.14900267124176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,balanced,0.2990880012512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,balanced,0.15050133069356283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,balanced,0.3025173346201579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,balanced,0.1525706648826599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,balanced,0.3182400067647298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,balanced,0.15345066785812378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,balanced,0.3852533499399821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,balanced,0.1557973325252533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,balanced,0.05594133337338766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.09937919974327088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,balanced,0.37624533971150714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,balanced,0.15637866655985513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.11537280082702636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,balanced,0.08259200056393941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,balanced,0.16140266259511313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,balanced,0.4855733315149943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.24232959747314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,balanced,0.13980266451835632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,balanced,0.1623093287150065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,balanced,0.556165337562561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.254911994934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,balanced,0.14409066239992777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,balanced,0.16451733311017355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.2606591939926147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,balanced,0.810533364613851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,balanced,0.1441386640071869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,balanced,0.17348267634709677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.27153279781341555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,balanced,0.14726932843526205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,balanced,0.18241600195566812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,balanced,1.0125333468119304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.27633280754089357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,balanced,0.1502400040626526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.01,0.058815997838973996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,balanced,0.18424000342686972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.2791935920715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,balanced,0.15145599842071533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,balanced,1.4969760576883953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,balanced,0.19252800941467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.01,0.0738048017024994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.28380799293518066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.2813888072967529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,balanced,0.24663466215133667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.01,0.09296000003814697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.29575679302215574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,balanced,2.084383964538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,power_law_1.01,0.05364480018615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,balanced,0.24678399165471396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.01,0.1443071961402893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.29825921058654786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,power_law_1.01,0.06629760265350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,balanced,0.31728533903757733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.01,0.14707839488983154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.3187455892562866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,balanced,0.1544373333454132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,power_law_1.01,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.34949119091033937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,balanced,3.043349266052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.01,0.14506239891052247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,balanced,0.3932853142420451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,balanced,0.15735999743143717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,power_law_1.01,0.14124159812927245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.3375999927520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.01,0.15396480560302733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,balanced,0.5627893209457397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,power_law_1.01,0.1366719961166382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.36470398902893064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.01,0.15427199602127076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,power_law_1.01,0.1502784013748169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.42736639976501467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,balanced,0.6659679810206095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,balanced,3.947632153828939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.01,0.156985604763031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,power_law_1.01,0.1606592059135437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.4688767910003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.01,0.16003199815750122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,power_law_1.01,0.16691839694976807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,balanced,0.9691786766052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.5749248027801513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.01,0.1630784034729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.697983980178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.01,0.16985599994659423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,balanced,4.864015897115071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.01,0.9212672233581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,balanced,1.3037707010904949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.08098559975624084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.01,0.16606080532073975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,power_law_1.01,0.16618880033493041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.01,1.1958335876464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,balanced,0.16176000237464905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.01,0.19405440092086793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.10965119600296021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,power_law_1.01,0.17386879920959472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.01,1.7005760192871093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,balanced,0.16548800468444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.01,0.20567679405212402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,balanced,1.8940107027689617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.01,2.127052879333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.13767679929733276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,balanced,0.17082132895787558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.01,0.2136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.2422271966934204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.01,3.184614372253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,balanced,0.17655466000239053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.01,0.21866240501403808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,power_law_1.01,0.1707136034965515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,balanced,7.721749623616536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.2542975902557373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.01,3.94634895324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,balanced,2.5032906532287598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.01,0.25313920974731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,power_law_1.01,0.17613439559936522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.24688000679016114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.01,0.2976576089859009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,power_law_1.01,0.1818560004234314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.05878400206565857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.01,4.937542343139649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,power_law_1.01,0.20617599487304689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.27199358940124513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.01,0.35190401077270506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.0769599974155426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,balanced,0.19459732373555502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.01,7.7657920837402346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,balanced,3.1282132466634116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.266592001914978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.01,0.43927679061889646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.08517760038375854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,power_law_1.01,0.20994560718536376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,balanced,0.20122667153676352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.01,0.5994559764862061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.2817919969558716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,power_law_1.01,0.22351999282836915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.14752639532089235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,balanced,0.21435733636220297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.01,15.652473449707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.01,0.7211904048919677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,power_law_1.01,0.25615999698638914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.28958721160888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.1447424054145813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,balanced,0.28356800476710003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,power_law_1.01,0.3162240028381348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.01,1.0334336280822753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.278931188583374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.14982399940490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,balanced,0.3113706707954407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.01,0.3760767936706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.01,1.3584704399108887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,balanced,15.540111541748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,balanced,4.917338689168294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.28815999031066897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.15559040307998656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.01,1.9465471267700196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.2947391986846924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.15488640069961548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.01,2.6587648391723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.34778239727020266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.15601919889450072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.01,0.56943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,balanced,0.47645866870880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.3443583965301514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.16003199815750122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.01,3.290911865234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.3471424102783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.01,0.7143424034118653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.16551680564880372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,balanced,0.6309279998143514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.01,4.926931381225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.39549438953399657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.01,1.0337920188903809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.16522879600524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,balanced,0.9433440367380778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.42778878211975097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.1699136018753052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.01,1.3170368194580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.01,9.385254669189454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.4664447784423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.1923135995864868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,balanced,1.254256010055542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.01,1.939743995666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,balanced,9.5076904296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.5913919925689697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.21004800796508788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.01,2.5686080932617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,balanced,1.8547520637512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.6769152164459229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.21139841079711913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.01,3.8308032989501952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,1,power_law_1.2,0.9552000045776368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.22458879947662352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,balanced,2.4608586629231772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.01,5.090975952148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,1,power_law_1.2,1.204633617401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.26060800552368163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.01,6.308870315551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,1,power_law_1.2,1.7028863906860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.2874687910079956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,balanced,3.665792147318522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,1,power_law_1.2,2.0898624420166017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,power_law_1.01,10.060256195068359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,0.35773439407348634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,1,power_law_1.2,3.1476160049438477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,0.440396785736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,power_law_1.01,20.09081573486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,balanced,4.882255872090657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,0.6035840034484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,1,power_law_1.2,4.000998306274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,0.7274623870849609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,1,power_law_1.2,4.965830230712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,1.045740795135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,balanced,6.101989110310872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,1.3368895530700684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,1,power_law_1.2,7.705619049072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,1.9202688217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,1,power_law_1.2,15.912063598632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,2.691859245300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,1,power_law_1.2,3.3336769104003907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,balanced,9.850837071736654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,1,power_law_1.2,4.936883163452149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,1,power_law_1.2,9.353113555908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,balanced,20.348730723063152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,1,power_law_1.2,0.05386880040168762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,balanced,0.23574932416280112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,1,power_law_1.2,0.06620799899101257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,balanced,0.22844799359639487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,1,power_law_1.2,0.07966079711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,balanced,0.42193599541982013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,balanced,0.15390933553377786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,1,power_law_1.2,0.14256639480590821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,balanced,0.4251733223597209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,1,power_law_1.2,0.1435263991355896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,balanced,0.13581333557764688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,balanced,0.4231040080388387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,1,power_law_1.2,0.15125759840011596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,balanced,0.2329919934272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,balanced,0.42256001631418866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,1,power_law_1.2,0.15679359436035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,balanced,0.2386080026626587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,balanced,0.4235039949417114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,1,power_law_1.2,0.16663680076599122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,balanced,0.42324264844258624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,balanced,0.23658132553100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,balanced,0.43593064943949383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,balanced,0.24084800481796265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,balanced,0.439248005549113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,balanced,0.2412053346633911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,balanced,0.4384426673253377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,1,power_law_1.2,0.16727039813995362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,balanced,0.4500693480173747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,balanced,0.24359466632207236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,balanced,0.45575467745463055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,1,power_law_1.2,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,balanced,0.24368532498677573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,balanced,0.4601653416951497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.01,0.3644927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,balanced,0.4897600015004476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,balanced,0.24612800280253092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.01,0.39555199146270753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,balanced,0.4912906487782796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,1,power_law_1.2,0.16726399660110475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,balanced,0.25018133719762164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,balanced,0.4929120143254598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.01,0.29723520278930665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,1,power_law_1.2,0.17681280374526978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,balanced,0.2487786610921224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,balanced,0.5871359904607137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.01,0.42110719680786135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,balanced,0.543722669283549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,1,power_law_1.2,0.17907840013504028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,balanced,0.25410133600234985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.01,0.4203904151916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,balanced,0.7994346618652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,balanced,0.2593119939168294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,1,power_law_1.2,0.20259199142456055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,balanced,0.8923892974853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.01,0.46443519592285154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,balanced,0.27882667382558185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,balanced,0.14632532993952432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.01,0.4573696136474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,balanced,1.2669386863708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,1,power_law_1.2,0.21495680809020995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,balanced,0.28008532524108887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,balanced,0.12764267126719156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,balanced,1.5077759424845378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,1,power_law_1.2,0.2178879976272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.01,0.4649343967437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,balanced,0.2851946751276652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,balanced,0.22476800282796225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,1,power_law_1.2,0.2457024097442627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.01,0.5162367820739746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,balanced,2.3091413180033364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,balanced,0.3189813296000163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,balanced,0.229312002658844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,1,power_law_1.2,0.3117120027542114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.01,0.5265279769897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,balanced,0.3314773241678874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,balanced,0.2294666568438212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,balanced,3.0107946395874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.2,0.3764928102493286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.01,0.5528448104858399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,balanced,0.23202133178710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,balanced,0.47605331738789874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.21827199459075927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,balanced,0.23515733083089194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.01,0.7270400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.2,0.5391424179077149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,balanced,0.5430986483891805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,balanced,4.577343940734863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.2145792007446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,balanced,0.23494933048884073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.01,0.8573696136474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.2,0.6872704029083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.19173760414123536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,balanced,0.760213295618693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.01,0.6457024097442627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.23623039722442626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.2,0.9869503974914551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.23539199829101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,power_law_1.01,0.22445440292358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.01,0.7363840103149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.2,1.2896512031555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,balanced,0.9303413232167562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,balanced,6.554245630900065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.24467198848724364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.2,1.9090496063232423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.01,0.7563456058502197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,power_law_1.01,0.2245568037033081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.2746687889099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,balanced,0.23571733633677164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,balanced,1.385957400004069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.2586047887802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.2,2.502809524536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.01,0.7831232070922851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,power_law_1.01,0.18529920578002929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,balanced,0.2374133268992106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.01,0.26657919883728026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.327129602432251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.01,0.2726272106170654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.2,3.71459846496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,power_law_1.01,0.22922239303588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.01,0.9953472137451171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,balanced,8.864789326985678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,balanced,1.8561333020528157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,4,power_law_1.2,0.3907455921173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.01,0.28883841037750246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.01,1.2652735710144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,power_law_1.01,0.23135359287261964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.2,4.964806365966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.01,0.2831167936325073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,4,power_law_1.2,0.33580799102783204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,power_law_1.01,0.2737344026565552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.01,0.3221695899963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.01,1.9745599746704101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,balanced,2.8040641148885093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.2,6.13804817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,4,power_law_1.2,0.4240128040313721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.01,0.37776639461517336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,power_law_1.01,0.2939136028289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.01,2.4217920303344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.01,0.4312448024749756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,4,power_law_1.2,0.41941118240356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,1,power_law_1.2,9.773484802246093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,power_law_1.01,0.33400959968566896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.01,0.5990655899047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,4,power_law_1.2,0.4445184230804443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,balanced,13.032538096110025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.01,2.955660820007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,balanced,0.24337067206700644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.01,0.43615360260009767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,balanced,3.473674774169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,4,power_law_1.2,0.45474557876586913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.01,0.4985983848571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,balanced,0.24580800533294678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.01,4.111481475830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,0.5859712123870849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,1,power_law_1.2,19.82332763671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,4,power_law_1.2,0.4622208118438721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,balanced,0.2510773340861003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,power_law_1.01,0.2939903974533081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,1.0118847846984864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.01,6.785414123535157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,4,power_law_1.2,0.4949376106262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,balanced,0.2542506655057271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,power_law_1.01,0.3140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,1.2018495559692384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,balanced,4.433877309163411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,4,power_law_1.2,0.5927040100097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,1.6718399047851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.01,8.962073516845702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,4,power_law_1.2,0.6191487789154053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,2.6138816833496095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,power_law_1.01,0.2788800001144409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,3.8877632141113283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,4,power_law_1.2,0.7711808204650878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.01,11.997113800048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,balanced,0.26890132824579877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,4.42303352355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,power_law_1.01,0.3122431993484497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,4,power_law_1.2,0.8245439529418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,balanced,0.27507199843724567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,power_law_1.01,0.3456063985824585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,7.225433349609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,4,power_law_1.2,0.6070208072662353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,balanced,27.64807891845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,balanced,7.336037317911784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.01,18.715589904785155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,balanced,0.2836906711260478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,power_law_1.01,0.35155200958251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,4,power_law_1.2,0.7769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,10.64103012084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,balanced,0.38577067852020264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,4,power_law_1.2,0.804691219329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,balanced,0.40720001856486004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,power_law_1.01,0.42072319984436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.01,26.769778442382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.01,12.519878387451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,4,power_law_1.2,0.7992127895355224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,balanced,0.6132106781005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,power_law_1.01,0.4356287956237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,4,power_law_1.2,0.9894335746765137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,power_law_1.01,0.4983232021331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.01,16.519334411621095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,balanced,0.7927626768747965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,4,power_law_1.2,1.3782208442687989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,power_law_1.01,0.9109056472778321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.01,38.36927490234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,4,power_law_1.2,1.5145536422729493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.01,1.0231871604919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,4,power_law_1.2,2.452614402770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,balanced,16.31233088175456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.01,1.4439295768737792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.01,42.851742553710935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,4,power_law_1.2,3.1262975692749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,balanced,1.194207986195882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.01,1.9446783065795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,4,power_law_1.2,4.116153717041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,balanced,1.5914079348246257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.01,3.605926513671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,4,power_law_1.2,6.3959297180175785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.01,83.88475341796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,balanced,2.40336004892985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.01,3.806137466430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,4,power_law_1.2,8.500109100341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.01,6.273689651489258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,balanced,3.185920079549154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,4,power_law_1.2,14.706137084960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.01,10.721158599853515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,balanced,4.815087954203288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,4,power_law_1.2,24.165773010253908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.01,10.877811431884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.01,17.722438049316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,balanced,6.479967753092448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,4,power_law_1.2,29.30408935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,power_law_1.01,17.542124938964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,balanced,8.240682601928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,4,power_law_1.2,43.53510437011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,power_law_1.01,38.484921264648435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,balanced,13.801039377848307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,power_law_1.01,79.20057373046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,4,power_law_1.2,100.38720703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,balanced,32.16217549641927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.23087360858917236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.19545600414276124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.2122431993484497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.23697280883789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.23651199340820311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.24929919242858886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.28615679740905764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,4,power_law_1.2,0.20544641017913817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.2694463968276978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,4,power_law_1.2,0.16660480499267577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,4,power_law_1.2,0.2764672040939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,4,power_law_1.2,0.20555520057678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,balanced,0.14453867077827454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,4,power_law_1.2,0.22848639488220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,4,power_law_1.2,0.28873600959777834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,balanced,0.22315732638041177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,4,power_law_1.2,0.2310784101486206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,balanced,0.4312906662623088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,balanced,0.4214080174763997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,4,power_law_1.2,0.276857590675354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,4,power_law_1.2,0.27802879810333253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,balanced,0.4199093182881673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,balanced,0.08996267120043437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,4,power_law_1.2,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,balanced,0.4229439894358317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,4,power_law_1.2,0.3044287919998169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,4,power_law_1.2,0.3427455902099609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,balanced,0.42337600390116376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,balanced,0.13078932960828146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,balanced,0.4227199951807658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,balanced,0.22755199670791626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,4,power_law_1.2,0.3081279993057251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,balanced,0.4315306742986043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,balanced,0.23141332467397055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,balanced,0.43773333231608075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,4,power_law_1.2,0.3033344030380249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,4,power_law_1.2,0.422054386138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,balanced,0.23154133558273315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,balanced,0.4484800100326538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,4,power_law_1.2,0.2993599891662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,balanced,0.4497599999109904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,balanced,0.23387734095255533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,4,power_law_1.2,0.5267072200775147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,balanced,0.4503093163172404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,balanced,0.23607999086380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,balanced,0.47488534450531006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,4,power_law_1.2,0.5145343780517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,balanced,0.23836266994476318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,balanced,0.48396801948547363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,4,power_law_1.2,0.3027008056640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,balanced,0.4781706730524699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,balanced,0.23796266317367554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,4,power_law_1.2,0.3369152069091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,4,power_law_1.2,0.4097919940948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,balanced,0.08451199531555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,balanced,0.48784534136454266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,balanced,0.24087466796239218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,4,power_law_1.2,0.34350080490112306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,balanced,0.5816320180892944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,4,power_law_1.2,0.533900785446167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,balanced,0.12485333283742268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,balanced,0.24525866905848184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,4,power_law_1.2,0.36867198944091795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,balanced,0.5672479867935181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,balanced,0.21928000450134277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,balanced,0.24506133794784546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,0.6512767791748046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,balanced,0.7243413130442301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,4,power_law_1.2,0.39301118850708006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,balanced,0.22329066197077432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,balanced,0.24798399209976196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,balanced,0.828010638554891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,0.9620608329772949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,balanced,0.22418665885925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,balanced,0.262992004553477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,4,power_law_1.2,0.39165439605712893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,balanced,1.2139626344045003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,balanced,0.22824533780415854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,balanced,0.26904000838597614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,4,power_law_1.2,0.6039296150207519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,1.1225088119506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,balanced,0.23060266176859537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,balanced,1.5440160433451335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,balanced,0.27563732862472534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,4,power_law_1.2,0.864684772491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,balanced,0.23181867599487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,1.8552703857421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.2,1.1288448333740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,balanced,0.28108266989390057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,balanced,2.3344906171162925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,balanced,0.3440693219502767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.2,1.5016768455505372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,2.5603967666625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,balanced,3.1975412368774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.2,2.032383918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,balanced,0.3487573464711507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,3.9428863525390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.01,0.18863359689712525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,balanced,0.453818678855896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.01,0.12483839988708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,balanced,0.2352480093638102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,6.124236679077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,balanced,4.7863467534383135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.2,3.0223104476928713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.01,0.20126719474792482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,balanced,0.5392746527989706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,balanced,0.2378186583518982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.01,0.1417088031768799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,7.3374076843261715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.01,0.28714239597320557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.2,3.899628829956055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.01,0.1627519965171814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,balanced,0.7661813100179037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.01,0.41610240936279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.01,0.23036160469055175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,balanced,7.577775955200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.2,6.403449249267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,10.634368133544921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,balanced,0.9641866683959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.01,0.4149695873260498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.01,0.23120639324188233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.2,8.879424285888671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,balanced,1.405669371287028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.01,0.22641921043395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.01,0.41913599967956544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,4,power_law_1.2,16.606675720214845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.01,0.2455359935760498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.01,0.4199999809265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,balanced,9.381290435791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,balanced,0.24446400006612143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.2,15.037759399414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,balanced,1.8232693672180176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.01,0.23884799480438232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.01,0.4348288059234619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,4,power_law_1.2,23.148806762695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,balanced,0.24841066201527914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.01,0.2502592086791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.01,0.45299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,power_law_1.01,0.13781119585037233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,balanced,0.2527199983596802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.01,0.2682368040084839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,balanced,2.697493235270182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.2,21.67121276855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.01,0.4939712047576904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,power_law_1.01,0.14597760438919066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,balanced,0.25761600335439044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.01,0.25362560749053953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,power_law_1.01,0.15474560260772705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.01,0.4667200088500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,balanced,14.117387135823568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,power_law_1.01,0.2241663932800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.01,0.26971518993377686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,4,power_law_1.2,42.93900756835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.01,0.5212672233581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,power_law_1.01,0.2257024049758911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,balanced,3.8351732889811196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,4,power_law_1.2,29.76911315917969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.01,0.28334081172943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,power_law_1.01,0.2321216106414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.01,0.5518080234527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,power_law_1.01,0.26502399444580077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.01,0.2848063945770264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,balanced,0.27505600452423096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.01,0.5161407947540283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,power_law_1.01,0.28970239162445066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.01,0.32693119049072267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,balanced,0.28272533416748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.01,0.5695168018341065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,balanced,4.9424692789713545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,balanced,0.2950826684633891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.01,0.33292160034179685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.01,0.5934400081634521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,4,power_law_1.2,42.299755859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,power_law_1.01,0.275219202041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.01,0.353600001335144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,balanced,0.393338680267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.01,0.6501120090484619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,power_law_1.01,0.28615679740905764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,balanced,0.4147786696751912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.01,0.4213247776031494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.01,0.696230411529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.01,0.48052477836608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.01,0.9127872467041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,balanced,36.32171630859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.01,0.6532415866851806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,power_law_1.01,0.2699007987976074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,balanced,8.157994588216146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.01,1.1980928421020507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.01,0.8272383689880372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,power_law_1.01,0.29361279010772706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,balanced,0.6247040033340454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.01,1.3827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.01,1.1595711708068848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,power_law_1.01,0.3147583961486816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.01,1.927769660949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.01,1.640025520324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,balanced,0.8575839996337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,4,power_law_1.2,103.61917724609376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,power_law_1.01,0.3246335983276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.01,2.3076608657836912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.01,2.8421823501586916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,balanced,1.290618658065796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,power_law_1.01,0.3319551944732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.01,2.548966407775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.01,4.573011016845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,balanced,1.7018240292867024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,power_law_1.01,0.3250112056732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.01,3.8301376342773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.01,5.259104156494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,power_law_1.01,0.45043201446533204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,balanced,2.556704044342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,power_law_1.01,0.6159552097320556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,balanced,15.778308868408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.01,6.394086456298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.01,7.796307373046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,power_law_1.01,0.718233585357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.01,6.930105590820313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,balanced,3.4273598988850913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.01,10.165849304199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,power_law_1.01,0.9393152236938477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.01,10.700991821289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,power_law_1.01,1.1798015594482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.01,14.618424987792968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,balanced,5.129178682963054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,power_law_1.01,2.160416030883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,power_law_1.01,2.38222713470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.01,22.03221740722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.01,20.178373718261717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,power_law_1.01,4.190937423706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,balanced,6.899445215861003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,power_law_1.01,5.123923110961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,power_law_1.01,8.788671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.01,44.00053100585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,power_law_1.01,10.605990600585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,balanced,8.821615854899088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,power_law_1.01,13.321363830566407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,power_law_1.01,27.606918334960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,balanced,14.371562957763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,power_law_1.01,54.942498779296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,balanced,32.66097513834635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,2,power_law_1.2,0.24277760982513427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,2,power_law_1.2,0.24255359172821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,2,power_law_1.2,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,2,power_law_1.2,0.41498241424560545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,2,power_law_1.2,0.4140672206878662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,2,power_law_1.2,0.42082557678222654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,2,power_law_1.2,0.445139217376709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,2,power_law_1.2,0.43182082176208497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,2,power_law_1.2,0.14893440008163453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,2,power_law_1.2,0.4862207889556885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,2,power_law_1.2,0.14357759952545165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,2,power_law_1.2,0.49402241706848143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,2,power_law_1.2,0.17745280265808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,2,power_law_1.2,0.46951680183410643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,2,power_law_1.2,0.11481599807739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,2,power_law_1.2,0.22902400493621827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,balanced,0.14082666238149008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,2,power_law_1.2,0.4955711841583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,2,power_law_1.2,0.2351232051849365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,balanced,0.2193386753400167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,2,power_law_1.2,0.1141759991645813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,2,power_law_1.2,0.523526382446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,2,power_law_1.2,0.242195200920105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,balanced,0.4100000063578288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,2,power_law_1.2,0.5276351928710937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,2,power_law_1.2,0.1457152009010315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,2,power_law_1.2,0.252729606628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,2,power_law_1.2,0.22288639545440675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,2,power_law_1.2,0.5353727817535401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,balanced,0.41546134154001874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,2,power_law_1.2,0.24944000244140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,2,power_law_1.2,0.217305588722229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,2,power_law_1.2,0.5850495815277099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,balanced,0.41204265753428143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,2,power_law_1.2,0.2569024085998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,2,power_law_1.2,0.24552319049835206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,2,power_law_1.2,0.6347648143768311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,balanced,0.4147040049235026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,2,power_law_1.2,0.27234559059143065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,2,power_law_1.2,0.2742399930953979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,2,power_law_1.2,0.7910655975341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,balanced,0.4171253442764282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,2,power_law_1.2,0.2630399942398071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,balanced,0.08905599514643352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,2,power_law_1.2,0.2824320077896118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,2,power_law_1.2,0.8652095794677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,balanced,0.41974933942159015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,2,power_law_1.2,0.27692160606384275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,balanced,0.12807466586430868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,2,power_law_1.2,1.0997504234313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,balanced,0.4304853280385335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,2,power_law_1.2,0.27898240089416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,balanced,0.22485866149266562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,2,power_law_1.2,1.4484031677246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,2,power_law_1.2,0.29461119174957273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,balanced,0.43194135030110675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,2,power_law_1.2,0.26956160068511964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,balanced,0.22843732436498007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,2,power_law_1.2,0.33483519554138186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,2,power_law_1.2,2.0743167877197264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,balanced,0.4410293499628703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,2,power_law_1.2,0.2808063983917236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,balanced,0.22994667291641235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,balanced,0.44228800137837726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,2,power_law_1.2,0.33648641109466554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,2,power_law_1.2,3.098681640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,balanced,0.23245332638422647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,balanced,0.4437066713968913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,2,power_law_1.2,0.37421441078186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.14272639751434327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,balanced,0.23548267285029092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,2,power_law_1.2,4.034912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,2,power_law_1.2,0.2737728118896484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,balanced,0.47037867705027264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.19341440200805665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,2,power_law_1.2,0.4679999828338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,balanced,0.2358986735343933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,2,power_law_1.2,0.2899967908859253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,2,power_law_1.2,5.423603057861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.21561601161956787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,balanced,0.23758933941523233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,2,power_law_1.2,0.5253952026367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,balanced,0.47175467014312744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,2,power_law_1.2,0.3113408088684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.387174391746521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,balanced,0.24054400126139322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,2,power_law_1.2,7.835635375976563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,2,power_law_1.2,0.7467648029327393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,balanced,0.08545600374539693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,balanced,0.48068265120188397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.4111231803894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,2,power_law_1.2,0.3462080001831055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,balanced,0.24478399753570557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.41086721420288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,2,power_law_1.2,0.8768063545227051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,balanced,0.5001386801401774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.4261375904083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,2,power_law_1.2,11.540889739990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,balanced,0.247706671555837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,balanced,0.12341866890589397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,2,power_law_1.2,1.3054143905639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.43038082122802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,balanced,0.5486613512039185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,2,power_law_1.2,0.3510656118392944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,balanced,0.25109867254892987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.43622398376464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,balanced,0.2190826733907064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,2,power_law_1.2,1.698739242553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,2,power_law_1.2,0.36394879817962644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,balanced,0.562661329905192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,balanced,0.26153600215911865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.44812798500061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,2,power_law_1.2,16.371302795410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,2,power_law_1.2,0.4643904209136963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.45951361656188966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,balanced,0.22307199239730835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,balanced,0.27170666058858234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,2,power_law_1.2,2.6505727767944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,balanced,0.7231626510620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.48820481300354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,2,power_law_1.2,0.5665279865264893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,balanced,0.2244266668955485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,balanced,0.27432000637054443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,2,power_law_1.2,3.1277439117431642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.5045504093170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,balanced,0.9163359800974528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,2,power_law_1.2,22.51131591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,2,power_law_1.2,0.7359551906585693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,balanced,0.22859734296798706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,balanced,0.2847413420677185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.5228479862213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,2,power_law_1.2,4.658662414550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.5523392200469971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,balanced,1.3039466540018718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,balanced,0.23269865910212198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,balanced,0.36110401153564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.5901247978210449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,2,power_law_1.2,1.0739904403686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,balanced,0.234224001566569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,2,power_law_1.2,5.332307052612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,balanced,0.36371731758117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.5734911918640136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,balanced,1.673525333404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.6738048076629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,2,power_law_1.2,1.300211238861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,balanced,0.5026986598968506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,2,power_law_1.2,52.34619140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.7425600051879883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,2,power_law_1.2,9.373741149902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,balanced,2.466053326924642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,2,power_law_1.2,2.148512077331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,balanced,0.5863413413365682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.9312704086303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.08802559971809387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.01,1.1625151634216309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,2,power_law_1.2,2.812620735168457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,2,power_law_1.2,12.090630340576173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,balanced,0.8434933026631674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,balanced,0.238319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.01,1.520627212524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,balanced,3.551919937133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.1126207947731018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.01,2.004934310913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,2,power_law_1.2,4.247443389892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,balanced,0.24141865968704224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,balanced,1.0083680152893066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.12651519775390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.01,2.8589120864868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,2,power_law_1.2,23.724147033691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.21802239418029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.01,3.741836929321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,2,power_law_1.2,6.000140762329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,balanced,5.285087903340657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,balanced,1.438810666402181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.01,5.495487976074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.22856318950653076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,2,power_law_1.2,8.361894226074218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.22839040756225587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.01,6.573926544189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,balanced,2.0769920349121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,balanced,6.37991460164388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.23872640132904052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.01,8.11181411743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,2,power_law_1.2,10.421612548828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.2344383955001831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,balanced,3.056415875752767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.01,13.1210693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,balanced,0.25144000848134357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.24039039611816407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,2,power_law_1.2,15.720697021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.2457792043685913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,balanced,8.030485153198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,balanced,0.25702933470408124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,balanced,3.971877415974935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.01,25.225190734863283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,balanced,0.2632693250974019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.25162880420684813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.25937280654907224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,2,power_law_1.2,28.034625244140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,balanced,0.27134400606155396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.2680959939956665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,balanced,0.2908959984779358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,balanced,4.921210606892903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.01,0.2860415935516357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.01,0.2971008062362671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,balanced,0.30250134070714313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,balanced,12.948623657226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.01,0.3071743965148926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.01,0.3484863996505737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,balanced,0.3179840048154195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,2,power_law_1.2,62.32957153320312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.01,0.4314112186431885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,balanced,0.43093331654866535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,balanced,7.697519938151042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,0.4568319797515869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,0.5822144031524659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,balanced,0.4835679928461711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,0.661843204498291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,balanced,0.7227786382039388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,0.909939193725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,1.124499225616455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,balanced,0.9710559844970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,balanced,25.22936503092448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,1.6516544342041015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,balanced,1.4529333114624023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,2.113580894470215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,balanced,15.088506062825521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,balanced,1.9170880317687988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,3.109779167175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,balanced,2.8626559575398765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,4.181209564208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.01,5.200236892700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,balanced,3.829445203145345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.01,7.709465789794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,balanced,5.789578755696614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.01,15.03387451171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,balanced,7.751525243123372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,balanced,9.887872060139975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,balanced,16.44325892130534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,balanced,36.5216064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.12080639600753784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.16431360244750975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.2454911947250366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,power_law_1.01,0.08439679741859436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.4059584140777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,power_law_1.01,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.41120638847351076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,power_law_1.01,0.12081279754638671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.4210752010345459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,power_law_1.01,0.2124351978302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.41692800521850587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,power_law_1.01,0.22370560169219972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,1,power_law_1.2,0.08818560242652893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.42945280075073244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,power_law_1.01,0.24019839763641357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,1,power_law_1.2,0.10666240453720092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.4315968036651611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,power_law_1.01,0.25125119686126707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,1,power_law_1.2,0.15457279682159425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.4615744113922119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.4587200164794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,1,power_law_1.2,0.2229248046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,power_law_1.01,0.2688960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.480620813369751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,1,power_law_1.2,0.2291775941848755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.48821120262145995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,1,power_law_1.2,0.23503360748291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.5123839855194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,power_law_1.01,0.26844799518585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,1,power_law_1.2,0.23569920063018798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.5298495769500733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,1,power_law_1.2,0.23970561027526854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,power_law_1.01,0.2660608053207397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.5485504150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,1,power_law_1.2,0.24376959800720216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.5629183769226074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,1,power_law_1.2,0.25144960880279543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.6629631996154786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,power_law_1.01,0.26625919342041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,1,power_law_1.2,0.2522239923477173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.7608704090118408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.9349632263183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,1,power_law_1.2,0.26092801094055174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,power_law_1.01,0.27149438858032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,1,power_law_1.2,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,1,power_law_1.2,1.13056640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,1,power_law_1.2,0.2598144054412842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,power_law_1.01,0.29114880561828616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,1,power_law_1.2,0.096806401014328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,1,power_law_1.2,0.28659839630126954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,1,power_law_1.2,1.5692543983459473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,power_law_1.01,0.31215360164642336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,1,power_law_1.2,0.12379519939422608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,1,power_law_1.2,0.3047039985656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,power_law_1.01,0.3214272022247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,1,power_law_1.2,1.9914560317993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,1,power_law_1.2,0.222707200050354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,1,power_law_1.2,0.3135551929473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,power_law_1.01,0.34442241191864015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,1,power_law_1.2,2.9247936248779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,1,power_law_1.2,0.3407104015350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,1,power_law_1.2,0.224070405960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,power_law_1.01,0.3861504077911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,1,power_law_1.2,0.4052864074707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,1,power_law_1.2,3.7746944427490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,power_law_1.01,0.4875135898590088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,1,power_law_1.2,0.24077439308166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,1,power_law_1.2,0.4582335948944092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.01,0.6098368167877197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,1,power_law_1.2,0.25516159534454347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,1,power_law_1.2,5.487750244140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.01,0.8578047752380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,1,power_law_1.2,0.5678400039672852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,1,power_law_1.2,0.26387839317321776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.01,1.0889535903930665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,1,power_law_1.2,0.6863615989685059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,1,power_law_1.2,6.526995086669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.01,1.5941503524780274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,1,power_law_1.2,0.9031359672546386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,1,power_law_1.2,1.131552028656006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.01,2.0888256072998046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,1,power_law_1.2,8.11928939819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,1,power_law_1.2,0.25747840404510497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,1,power_law_1.2,1.6527551651000976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.01,3.0362112045288088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,1,power_law_1.2,0.267903995513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,1,power_law_1.2,12.879347229003907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,1,power_law_1.2,2.125235176086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.01,3.99865608215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,1,power_law_1.2,3.130156707763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.01,5.9668224334716795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,1,power_law_1.2,0.2637696027755737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,1,power_law_1.2,25.10334014892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,1,power_law_1.2,4.175347137451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,1,power_law_1.2,0.27463040351867674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.01,7.892940521240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,1,power_law_1.2,0.29212160110473634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,1,power_law_1.2,0.31140480041503904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.01,9.913836669921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,1,power_law_1.2,5.217292785644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,1,power_law_1.2,0.3210047960281372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,1,power_law_1.2,0.33793280124664304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,1,power_law_1.2,7.667533111572266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,power_law_1.01,16.067091369628905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,1,power_law_1.2,0.39040000438690187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,1,power_law_1.2,0.4792640209197998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.2,0.6067391872406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,1,power_law_1.2,14.967015075683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,balanced,0.1097866694132487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.2,0.8389504432678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,power_law_1.01,34.371340942382815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.2,1.0696895599365235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,balanced,0.15094932913780212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.2,1.545081615447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,balanced,0.2651573419570923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.2,2.0143423080444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,balanced,0.490229328473409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.2,2.9647296905517577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,balanced,0.9461706479390463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.2,3.9091201782226563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,balanced,1.8513867060343425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.2,5.80975341796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,balanced,1.8550559679667156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,balanced,0.07763200004895528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.2,7.805184173583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,balanced,1.8355520566304524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,balanced,0.09949866930643718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,balanced,1.8425493240356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.2,9.700198364257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,balanced,0.1596213380495707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,balanced,1.8416694005330403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,balanced,0.2741919954617818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,balanced,1.875424067179362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,1,power_law_1.2,15.606950378417968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,balanced,0.5019253492355347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,balanced,1.8771360715230305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,balanced,0.954261302947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,balanced,0.9613920052846273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,balanced,1.8802080154418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,1,power_law_1.2,34.53484191894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,balanced,0.9583573341369629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,balanced,1.860597292582194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,balanced,0.9639519850413004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,balanced,1.870757261912028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,balanced,0.9615573088328043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,balanced,1.881333351135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,balanced,0.9775839646657308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,balanced,1.896959940592448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,balanced,0.9846826394399008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,balanced,1.9717493057250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,balanced,0.993173360824585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,balanced,0.08238933483759563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,balanced,0.9950133164723715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,balanced,2.0164106686909995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,balanced,0.1051626702149709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,balanced,1.0098666350046794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,balanced,0.18105065822601318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,balanced,2.073909282684326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,balanced,1.0128479798634846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,balanced,0.27480532725652057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,balanced,1.0356853008270264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,balanced,0.49769067764282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,balanced,2.1826133728027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,balanced,0.9392000039418539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,balanced,1.0575573444366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,balanced,0.9436853726704916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,balanced,2.260042667388916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,balanced,1.093125343322754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,balanced,0.9475786685943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,balanced,0.9520053068796793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,balanced,1.1344746748606365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,balanced,2.3677546183268228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,balanced,0.9560480117797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,balanced,0.9633119901021322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,balanced,1.21616530418396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,balanced,0.9711679617563883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,balanced,0.9783466657002767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,balanced,3.2167892456054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,balanced,1.2864747047424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,balanced,0.9913600285847982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.01,0.28947839736938474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,balanced,1.0101919968922932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,balanced,1.390874703725179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.01,0.4890880107879639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,balanced,1.0210506916046143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,balanced,3.341087977091471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.01,0.3363327980041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.01,0.4221759796142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,balanced,1.0428586800893147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.01,0.718559980392456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,balanced,1.7226452827453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.01,0.9304896354675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.01,1.3302335739135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.01,1.3469247817993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,balanced,3.85374387105306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,balanced,1.0969759623209636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.01,1.3905920028686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,balanced,1.930938720703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.01,1.473408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.01,1.5780415534973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.01,1.6180736541748046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.01,1.8006208419799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.01,1.6609216690063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.01,1.6717439651489259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,balanced,2.5454187393188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,balanced,1.1657226880391438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.01,1.7442304611206054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,balanced,5.117061297098796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.01,1.827552032470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,balanced,1.2661226590474446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.01,2.0123903274536135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.01,2.2105728149414063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,balanced,1.3603307406107585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.01,2.583161544799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.01,2.3292095184326174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,balanced,1.5811999638875325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.01,2.6955904006958007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,balanced,3.3060852686564126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.01,3.2315902709960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,balanced,1.7605013847351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.01,3.7921409606933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,balanced,5.9254506429036455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.01,4.845369720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.01,6.18590087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,balanced,2.537813345591227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.01,8.13406753540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.01,0.17719680070877075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.01,9.85726089477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.01,0.2676032066345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,balanced,2.9597813288370767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,balanced,3.9850667317708335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.01,13.219532775878907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.01,0.15072640180587768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.01,0.2348543882369995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.01,0.39059839248657224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.01,26.363418579101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.01,0.49431681632995605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.01,0.6646080017089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.01,0.7387712001800537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,balanced,4.300234794616699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.01,0.7589888095855712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,balanced,10.066789627075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,4,power_law_1.2,0.2915008068084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.01,0.7754623889923096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.01,0.8340607643127441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,4,power_law_1.2,0.50348801612854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,power_law_1.01,0.17281919717788696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.01,0.8320192337036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,4,power_law_1.2,0.19354239702224732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.01,0.8490495681762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,power_law_1.01,0.2847359895706177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,4,power_law_1.2,0.3818943977355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.01,0.8907327651977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,power_law_1.01,0.1896191954612732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.01,0.8860287666320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,4,power_law_1.2,0.6643328189849853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.01,0.9407232284545899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,balanced,5.966474533081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,power_law_1.01,0.25897600650787356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,balanced,6.15342394510905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,4,power_law_1.2,0.8324735641479493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.01,1.0531328201293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,power_law_1.01,0.3525824069976807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,4,power_law_1.2,1.3276415824890138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,power_law_1.01,0.4785344123840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.01,1.1468031883239747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,power_law_1.01,0.6650047779083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,4,power_law_1.2,1.3817855834960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.01,1.1262463569641112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,power_law_1.01,0.7260799884796143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,4,power_law_1.2,1.4078783988952637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.17848960161209107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.01,1.339840030670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,power_law_1.01,0.7384384155273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,power_law_1.01,0.7642879962921143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,4,power_law_1.2,1.47391996383667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.01,1.267033576965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,4,power_law_1.2,0.25569920539855956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,power_law_1.01,0.8245375633239747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,4,power_law_1.2,1.6367231369018556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,4,power_law_1.2,0.12473599910736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.01,1.4677311897277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,power_law_1.01,0.8600704193115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,4,power_law_1.2,1.7735935211181642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,4,power_law_1.2,0.2474047899246216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.01,1.6260032653808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,balanced,7.353621164957683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,power_law_1.01,0.9027263641357421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,4,power_law_1.2,0.34067840576171876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,4,power_law_1.2,1.8516992568969726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,power_law_1.01,0.9357439994812011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.01,2.1184959411621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,4,power_law_1.2,0.42500481605529783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,power_law_1.01,1.0033984184265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,4,power_law_1.2,1.7459327697753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.01,2.5212352752685545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,4,power_law_1.2,0.7014272212982178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,power_law_1.01,1.0890624046325683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,4,power_law_1.2,1.7975040435791017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,power_law_1.01,1.239948844909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,4,power_law_1.2,0.6900415897369385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.01,3.4777854919433593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,4,power_law_1.2,1.9090240478515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,4,power_law_1.2,0.7345727920532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.01,4.51464958190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,4,power_law_1.2,1.9367168426513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,4,power_law_1.2,0.7508543968200684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,power_law_1.01,1.2295231819152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,4,power_law_1.2,2.2451711654663087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,4,power_law_1.2,0.8069375991821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.01,5.330835342407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,4,power_law_1.2,2.4680448532104493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,4,power_law_1.2,0.8215680122375488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,4,power_law_1.2,2.957689666748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.01,7.511033630371093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.01,1.2574848175048827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,4,power_law_1.2,0.8353152275085449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,balanced,18.281487782796223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,4,power_law_1.2,2.6806400299072264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,4,power_law_1.2,0.9216447830200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.01,1.4864768028259276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,4,power_law_1.2,0.9263360023498535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.01,14.392658996582032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,4,power_law_1.2,2.9821184158325194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.01,1.7311424255371093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,4,power_law_1.2,0.9812607765197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.01,1.961471939086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,4,power_law_1.2,3.691750335693359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,4,power_law_1.2,1.0862848281860351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,balanced,12.847845713297525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.01,2.4685440063476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,4,power_law_1.2,4.291756820678711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,4,power_law_1.2,1.2209152221679687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.01,3.4654720306396483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,4,power_law_1.2,5.472601699829101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,1.234553623199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.01,4.171852874755859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,balanced,11.889413197835287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,1.4468352317810058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,4,power_law_1.2,6.372415924072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.01,6.608646392822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,1.3709952354431152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,4,power_law_1.2,8.131231689453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.01,7.6802818298339846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,1.556230354309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,1.846873664855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,power_law_1.01,9.891629028320313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,4,power_law_1.2,9.84936294555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,2.3095680236816407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.01,16.259706115722658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,4,power_law_1.2,16.017414855957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,2.919718360900879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,3.7399551391601564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.01,31.86040344238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,4,power_law_1.2,35.90862121582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,5.088256072998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,4,power_law_1.2,5.473177719116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,4,power_law_1.2,8.905913543701171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,4,power_law_1.2,16.913427734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,balanced,25.919504801432293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,4,power_law_1.2,0.17310719490051268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,4,power_law_1.2,0.2643071889877319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,4,power_law_1.2,0.1383679986000061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,4,power_law_1.2,0.23482880592346192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,4,power_law_1.2,0.3611135959625244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,4,power_law_1.2,0.4577536106109619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,4,power_law_1.2,0.6725247859954834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,4,power_law_1.2,0.6932096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,4,power_law_1.2,0.7234560012817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,4,power_law_1.2,0.785971212387085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,4,power_law_1.2,0.8463295936584473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,4,power_law_1.2,0.8800831794738769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,4,power_law_1.2,0.928223991394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,4,power_law_1.2,0.9932479858398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,4,power_law_1.2,1.0975296020507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,4,power_law_1.2,1.1306752204895019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,4,power_law_1.2,1.2875712394714356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,4,power_law_1.2,1.3310400009155274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,balanced,0.10804266730944316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.2,1.3259008407592774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,balanced,0.15266666809717813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,balanced,0.2644266684850057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,balanced,0.0775786687930425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.2,1.637548828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,balanced,0.4959253470102946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,balanced,0.9481226603190104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.2,1.8746944427490235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,balanced,0.10072533289591472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,balanced,1.8613279660542805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,balanced,0.1577173372109731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,balanced,1.8695573806762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.2,2.213235282897949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,balanced,1.8445919354756672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,balanced,0.27642667293548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.2,2.4417280197143554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,balanced,1.8548587163289387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,balanced,0.5045706828435262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,balanced,1.854474703470866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.2,3.511257553100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,balanced,0.9608426888783773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,balanced,1.8645280202229817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,balanced,1.875343958536784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,balanced,0.9758773644765218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.2,4.804735946655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,balanced,1.8822399775187175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,balanced,0.9732000033060709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,balanced,1.8948319753011067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,balanced,0.9778506755828857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.2,6.5634819030761715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,balanced,1.902656078338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,balanced,0.9898026784261068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,balanced,1.9169386227925618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,balanced,0.9941386381785074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,balanced,1.9378827412923176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.2,8.332959747314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,balanced,0.9973226388295492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,balanced,2.029791990915934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,balanced,1.0107573668162029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,4,power_law_1.2,10.513664245605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,balanced,2.0993119875590005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,balanced,1.0114986896514893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,balanced,2.1650613149007163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,balanced,1.041274627049764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.2,17.157203674316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,balanced,1.0453706582387288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,balanced,2.301482677459717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.01,0.17562880516052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,balanced,0.09668800234794617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,balanced,1.0655146439870198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.01,0.2632575988769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,balanced,1.0978986422220867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,balanced,0.11691733201344807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,balanced,2.4413973490397134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.01,0.2140415906906128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,balanced,0.18890666961669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,balanced,1.1404106616973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.2,35.39937133789063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,balanced,0.2906986673672994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.01,0.37150719165802004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,balanced,0.5104480187098185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.01,0.611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,balanced,1.214629332224528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,balanced,2.592672030131022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,balanced,0.9531520207722982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.01,0.8974207878112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.01,0.11020799875259399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,balanced,0.9600906372070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,balanced,1.2920479774475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.01,1.307539176940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,balanced,0.9663413365681967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.01,1.3603391647338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.01,0.15679359436035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,balanced,3.0922346115112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.01,1.3827263832092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,balanced,0.973082701365153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,balanced,1.4436160723368328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.01,0.1361791968345642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.01,1.4460160255432128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,balanced,0.9787733554840088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.01,0.22119040489196778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,power_law_1.01,0.13829760551452636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.01,1.4962112426757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,balanced,0.9904373486836752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,balanced,1.6108959515889485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.01,1.5531583786010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.01,0.3642303943634033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,power_law_1.01,0.18935680389404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,balanced,3.34713077545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,balanced,1.0016533533732097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.01,1.5814335823059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,2,power_law_1.2,0.17546240091323853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,power_law_1.01,0.14203519821166993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.01,0.4807487964630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.01,1.6217023849487304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,balanced,1.0130346616109211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,2,power_law_1.2,0.2634687900543213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,power_law_1.01,0.2235327959060669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.01,0.6735487937927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.01,1.65283203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,balanced,2.014901320139567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,2,power_law_1.2,0.19169919490814208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,balanced,1.0303733348846436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.01,1.7452735900878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,power_law_1.01,0.3563647985458374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.01,0.7365439891815185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,2,power_law_1.2,0.33748478889465333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.01,1.791654396057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,power_law_1.01,0.49992961883544923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,balanced,1.0546613534291585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.01,0.7610303878784179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.01,1.9775423049926757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,balanced,1.0735999743143718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,2,power_law_1.2,0.5475135803222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,balanced,4.252496083577474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,power_law_1.01,0.7353216171264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.01,0.754099178314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.01,2.1867904663085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,balanced,2.2897226015726724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,balanced,1.1198026339213054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,2,power_law_1.2,0.7563519954681397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.01,0.8080384254455566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,power_law_1.01,0.7378816127777099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.01,2.4847232818603517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,2,power_law_1.2,1.2263872146606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.01,0.8603072166442871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,power_law_1.01,0.7898816108703614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.01,2.5295103073120115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.01,0.8901120185852051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.01,2.913350486755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,2,power_law_1.2,1.3323904037475587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,power_law_1.01,0.7974847793579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.01,0.9023360252380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.01,2.9336448669433595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,2,power_law_1.2,1.3969408035278321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,power_law_1.01,0.8383808135986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,balanced,1.213327964146932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.01,0.9162431716918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.01,3.522137451171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,balanced,3.10753599802653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,power_law_1.01,0.9216256141662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,2,power_law_1.2,1.4607935905456544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,balanced,5.634442647298177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.01,4.353683090209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.01,0.9598143577575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,2,power_law_1.2,1.5098112106323243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,power_law_1.01,0.9568639755249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.01,1.0124159812927247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.01,5.984435272216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,2,power_law_1.2,1.590988826751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,power_law_1.01,1.009280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.01,1.1210495948791503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.01,6.99450912475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,2,power_law_1.2,1.6062911987304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,power_law_1.01,1.060537624359131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.01,1.1230079650878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.01,8.425849914550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,2,power_law_1.2,1.6663232803344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,power_law_1.01,1.131500816345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.01,1.2699007987976074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,balanced,1.3128853638966878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,2,power_law_1.2,1.75863037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,power_law_1.01,1.2618559837341308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,balanced,4.234218597412109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.01,1.3418944358825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.01,13.705619812011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,2,power_law_1.2,1.805619239807129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.01,1.5502976417541503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,balanced,1.47652800877889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,2,power_law_1.2,1.88023681640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,balanced,7.696762720743815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.01,1.7923904418945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,power_law_1.01,1.3799039840698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.01,24.91887969970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,balanced,1.6236000061035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,2,power_law_1.2,2.047942352294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.01,2.437062454223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,2,power_law_1.2,2.2141887664794924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.01,2.7371967315673826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,power_law_1.01,1.3582079887390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,balanced,2.003392060597738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,2,power_law_1.2,2.5563968658447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.01,3.7927169799804688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,power_law_1.01,1.606470489501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,2,power_law_1.2,2.616659164428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,power_law_1.01,1.9259136199951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,balanced,4.918154716491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.01,4.8627777099609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,balanced,2.3098719914754233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,2,power_law_1.2,3.0854976654052733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,power_law_1.01,2.3315263748168946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.01,5.764972686767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,2,power_law_1.2,3.211404800415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,power_law_1.01,2.8701311111450196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,2,power_law_1.2,3.895507049560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.01,9.023737335205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,balanced,3.462421417236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,power_law_1.01,4.020601654052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,2,power_law_1.2,4.638623809814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,power_law_1.01,4.794796752929687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,2,power_law_1.2,6.336108779907226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.01,16.663282775878905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,balanced,13.275375366210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,power_law_1.01,7.131251525878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,2,power_law_1.2,7.187500762939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,balanced,4.210954666137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,power_law_1.01,9.125286102294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,2,power_law_1.2,8.457478332519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,power_law_1.01,10.527378845214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,2,power_law_1.2,14.487814331054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,balanced,8.234629313151041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,power_law_1.01,18.087391662597657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,balanced,6.0313065846761065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,power_law_1.2,24.715110778808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,power_law_1.01,37.02901611328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,balanced,8.296597162882486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,balanced,10.27459716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,2,balanced,25.139658610026043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,2,power_law_1.2,0.11005439758300781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,2,power_law_1.2,0.1556671977043152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,balanced,16.289061228434246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,2,power_law_1.2,0.12038400173187255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,2,power_law_1.2,0.2019200086593628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,2,power_law_1.2,0.315775990486145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,2,power_law_1.2,0.39874560832977296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,2,power_law_1.2,0.6467775821685791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,balanced,17.190789540608723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,2,power_law_1.2,0.7004096031188964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,2,power_law_1.2,0.7279295921325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,2,power_law_1.2,0.760748815536499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,2,power_law_1.2,0.7956607818603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,2,power_law_1.2,0.8433088302612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,2,power_law_1.2,0.8678912162780762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,2,power_law_1.2,0.9094271659851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,2,power_law_1.2,0.9771007537841797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,2,power_law_1.2,0.9834431648254395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,2,power_law_1.2,1.0216192245483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,2,power_law_1.2,1.1688384056091308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,2,power_law_1.2,1.1866047859191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,2,power_law_1.2,1.3999551773071288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,2,power_law_1.2,1.4127231597900392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,2,power_law_1.2,1.7059711456298827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,2,power_law_1.2,1.9321088790893555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,2,power_law_1.2,2.5701120376586912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,2,power_law_1.2,3.066636848449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,2,power_law_1.2,4.226508712768554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,2,power_law_1.2,5.104684829711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,2,power_law_1.2,0.13725440502166747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,2,power_law_1.2,0.18645119667053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,2,power_law_1.2,5.976102447509765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,2,power_law_1.2,0.13768320083618163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,2,power_law_1.2,0.2315903902053833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,2,power_law_1.2,8.617984008789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,2,power_law_1.2,0.3245055913925171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,balanced,34.680102030436196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,2,power_law_1.2,0.4345983982086182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,2,power_law_1.2,0.6595327854156494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,2,power_law_1.2,19.453266906738282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,2,power_law_1.2,0.71943678855896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,2,power_law_1.2,0.7526591777801513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,2,power_law_1.2,0.7917247772216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,2,power_law_1.2,0.826636791229248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,2,power_law_1.2,0.8823871612548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,2,power_law_1.2,0.8833215713500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,2,power_law_1.2,1.0101375579833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,2,power_law_1.2,1.1040575981140137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,2,power_law_1.2,1.1410240173339843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,balanced,0.10300266742706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,2,power_law_1.2,1.278553581237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,balanced,0.154341330130895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,2,power_law_1.2,1.3915200233459473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,balanced,0.264357328414917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,balanced,0.08036800225575765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,balanced,0.5008106629053751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,2,power_law_1.2,1.447763156890869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,balanced,0.10413333773612976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,balanced,0.9754400253295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,balanced,0.16236799955368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,2,power_law_1.2,1.69866886138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,balanced,0.28493332862854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,balanced,1.8832319577534993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,2,power_law_1.2,2.0409664154052733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,balanced,0.5256160100301107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,balanced,1.8886559804280598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,2,power_law_1.2,2.3973440170288085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,balanced,1.004479964574178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,balanced,1.9117387135823567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,balanced,1.0338986714680989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,2,power_law_1.2,3.0588287353515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,balanced,1.9228906631469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,balanced,1.00764266649882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,2,power_law_1.2,4.133894348144532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,balanced,1.0144480069478352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,balanced,1.9269067446390789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,balanced,0.13541866342226663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,balanced,1.0420640309651692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,2,power_law_1.2,5.414828872680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,balanced,1.9149707158406575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,balanced,1.0357866287231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,balanced,0.1507146656513214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,2,power_law_1.2,7.241600036621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,balanced,0.21694932381312051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,balanced,1.0486186345418294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,balanced,1.9347519874572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,balanced,0.31380800406138104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,balanced,1.0510400136311848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,balanced,1.9338560104370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,2,power_law_1.2,9.710310363769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,balanced,0.5447253386179606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,balanced,1.063370704650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,balanced,1.9190346399943035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,balanced,1.014309326807658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,balanced,1.0262080033620198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,balanced,1.0798880259195964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,balanced,1.9365439414978027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,2,power_law_1.2,12.283475494384765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,balanced,1.035200039545695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,balanced,1.0953173637390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,balanced,1.9480106035868328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,balanced,1.0481493473052979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.11110399961471558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,balanced,1.1355626583099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,balanced,1.970256010691325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,2,power_law_1.2,19.53180847167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,balanced,1.0538240273793538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.15415680408477783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,balanced,1.1869280338287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,balanced,1.0702239672342937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,balanced,2.098735968271891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.17244800329208373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,balanced,1.0872480074564617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,balanced,1.2903146743774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,balanced,2.19266668955485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.3707263946533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,balanced,1.105130672454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,2,power_law_1.2,34.72066040039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,balanced,1.4143679936726887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.6280640125274658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,balanced,1.147333304087321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,balanced,2.309984048207601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.07827839851379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.8957056045532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,balanced,1.1882399717966716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.10119680166244507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,balanced,1.5160959561665852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,balanced,2.4755147298177085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,balanced,1.2265013058980305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.01,1.27007999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.11278719902038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.01,1.3271552085876466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,balanced,1.2896640300750732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.01,0.22744319438934327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,balanced,1.7868852615356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,balanced,2.737589200337728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.01,1.4485312461853028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.01,0.34004480838775636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.01,1.4649855613708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.01,0.47964158058166506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,balanced,2.0488425890604653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.01,1.4965760231018066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.01,0.6824639797210693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,balanced,3.06280517578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,balanced,1.451514720916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.01,0.6943039894104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.01,1.5697216033935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.01,0.7514111995697021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.01,1.6225536346435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,balanced,2.721743901570638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,balanced,3.633791923522949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.01,0.7700863838195801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.01,1.6455615997314452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.01,0.8046719551086425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.01,1.716806411743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.01,0.8538944244384765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.01,1.7543615341186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,balanced,3.35042667388916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.01,0.8928704261779785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,balanced,1.6378240585327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.01,1.8394432067871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,balanced,4.365088144938151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.01,0.9223360061645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.01,2.0238975524902343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,balanced,1.9433973630269368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.01,0.9668288230895996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.01,2.172064018249512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.01,1.0230400085449218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,balanced,2.22212807337443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.01,2.5576383590698244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.01,1.0472576141357421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,balanced,4.638175964355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.01,2.5239679336547853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.01,1.2039936065673829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,balanced,2.8954292933146157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.01,2.956934356689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,balanced,5.65662956237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,1.2726592063903808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.01,3.066419219970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,1.4042943954467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.01,3.790060806274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,1.5155584335327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,balanced,3.4694560368855796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.01,4.82861442565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,1.8054784774780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,2.057587242126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.01,6.634342193603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,balanced,5.663045247395833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,2.725017547607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.01,8.363475036621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,balanced,5.227984110514323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,balanced,7.367189407348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,3.410988616943359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.01,10.451078033447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,4.714886474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,5.976134490966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.01,17.16474304199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,balanced,6.436453501383464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.01,7.546886444091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,balanced,7.473578770955403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.01,29.893771362304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.01,11.756658935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,balanced,8.717882792154947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.01,23.374630737304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.10143359899520873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,balanced,9.46941884358724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.15006719827651976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.18202879428863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,power_law_1.01,0.13286399841308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.3516992092132568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,power_law_1.01,0.1598080039024353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.5326464176177979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,power_law_1.01,0.1695039987564087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.7669119834899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,1,power_law_1.2,1.2442815780639649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,power_law_1.01,0.25929598808288573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,balanced,12.577770233154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,1,power_law_1.2,1.3323776245117187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,balanced,10.893285115559896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,power_law_1.01,0.38490240573883056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,power_law_1.01,0.5051712036132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,1,power_law_1.2,1.3754816055297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,power_law_1.01,0.7171328067779541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,1,power_law_1.2,1.4844160079956055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,1,power_law_1.2,1.558035182952881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,power_law_1.01,0.7668799877166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,balanced,13.733839670817057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,1,power_law_1.2,1.5751808166503907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,power_law_1.01,0.7941247940063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,power_law_1.01,0.8266304016113282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,1,power_law_1.2,1.5913023948669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,power_law_1.01,0.8736895561218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,1,power_law_1.2,1.699648094177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,1,power_law_1.2,1.8255359649658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,power_law_1.01,0.9273152351379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,balanced,15.673802693684896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,1,power_law_1.2,1.8117504119873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,power_law_1.01,0.9813119888305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,1,power_law_1.2,1.8815231323242188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,power_law_1.01,1.0622655868530273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,power_law_1.01,1.1551551818847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,1,power_law_1.2,2.099135971069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,power_law_1.01,1.2230719566345214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,power_law_1.01,1.3819007873535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,1,power_law_1.2,2.2747520446777343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,1,power_law_1.2,2.5619327545166017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,power_law_1.01,1.473203182220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,1,power_law_1.2,2.6095680236816405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,1,power_law_1.2,2.995404815673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.01,1.632441520690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,1,power_law_1.2,3.3904769897460936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.01,2.044704055786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,1,power_law_1.2,4.156006240844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.01,2.416543960571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,1,power_law_1.2,5.086304092407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.01,3.027071952819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,balanced,25.77367401123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,1,power_law_1.2,6.892646026611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.01,3.767001724243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.07858560085296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,balanced,21.590609232584637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,1,power_law_1.2,8.803660583496093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.01,5.240505599975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.09957759976387023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.1208191990852356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.01,6.715711975097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,1,power_law_1.2,10.564627075195313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.20258560180664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,1,power_law_1.2,0.28822400569915774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.01,9.753298950195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,1,power_law_1.2,17.015744018554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,1,power_law_1.2,0.41077117919921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,balanced,27.674596150716145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.01,12.726009368896484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,1,power_law_1.2,0.6597504138946533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,1,power_law_1.2,0.6958784103393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,1,power_law_1.2,29.141253662109374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.01,15.8025146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,1,power_law_1.2,0.7442368030548095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,1,power_law_1.2,0.7846335887908935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,1,power_law_1.2,0.808620834350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,power_law_1.01,25.080300903320314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,1,power_law_1.2,0.8519743919372559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,1,power_law_1.2,0.9104000091552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,1,power_law_1.2,0.9402239799499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,power_law_1.01,50.155889892578124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,1,power_law_1.2,0.9992639541625976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,1,power_law_1.2,1.068019199371338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,1,power_law_1.2,1.1180607795715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,1,power_law_1.2,1.2601471900939942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,1.3072959899902343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,1.5344511985778808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,1.6112447738647462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,1.8391359329223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,balanced,52.66231791178385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,2.177926445007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,2.836089515686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,3.461638259887695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,4.782783889770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,6.234508895874024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,1,power_law_1.2,7.736083221435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,balanced,0.03223466624816259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,balanced,0.03372266640265783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,1,power_law_1.2,11.774521636962891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,balanced,0.0481333335240682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,balanced,0.0774293343226115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,balanced,0.12622400124867758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,1,power_law_1.2,0.1289728045463562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,1,power_law_1.2,23.160231018066405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,balanced,0.1253919998804728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,1,power_law_1.2,0.15923839807510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,balanced,0.1260426640510559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,1,power_law_1.2,0.1626688003540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,balanced,0.12760532895723978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,1,power_law_1.2,0.23306241035461425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,balanced,0.1276586651802063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,1,power_law_1.2,0.3357055902481079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,balanced,0.12786133090655008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,1,power_law_1.2,0.46645121574401854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,balanced,0.12867200374603271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,1,power_law_1.2,0.6915328025817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,balanced,0.13146133224169412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,1,power_law_1.2,0.7327680110931396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,balanced,0.13131733735402426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,balanced,0.13340800007184347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,1,power_law_1.2,0.7808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,balanced,0.1414240002632141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,1,power_law_1.2,0.8069055557250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,balanced,0.14389866590499878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,1,power_law_1.2,0.874675178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,balanced,0.14964266618092856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,1,power_law_1.2,0.9431743621826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,balanced,0.15802133083343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,1,power_law_1.2,0.976921558380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,1,power_law_1.2,1.0599295616149902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,balanced,0.16690667470296225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,1,power_law_1.2,1.1750847816467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,balanced,0.1790026624997457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,1,power_law_1.2,1.2564607620239259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,balanced,0.2003999948501587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,1,power_law_1.2,1.4215935707092284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,balanced,0.22779200474421182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,1,power_law_1.2,1.5651391983032226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,balanced,0.2545013427734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.2,1.701523208618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.2,2.096467208862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,balanced,0.3485333522160848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.2,2.4950719833374024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.2,3.113580894470215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,balanced,0.032458665470282234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.2,3.860697555541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,balanced,0.031514666974544525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,balanced,0.03706666578849157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,balanced,0.41416533788045246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.2,5.336294555664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,balanced,0.06048533320426941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,balanced,0.08548800150553386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,balanced,0.08656533559163411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.2,6.806400299072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,balanced,0.08638399839401245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,balanced,0.0865760048230489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.2,9.842086029052734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,balanced,0.08731200297673543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,balanced,0.08841600020726521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,balanced,0.08774933218955994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,balanced,0.5920053323109945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.2,12.794566345214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,balanced,0.09099733829498291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,balanced,0.0913813312848409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,balanced,0.09331732988357544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.2,15.831558227539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,power_law_1.01,0.04979200065135956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,balanced,0.09868266185124715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,power_law_1.01,0.04670720100402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,balanced,0.10061867038408916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,power_law_1.01,0.04465279877185822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,balanced,0.10563199718793233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,1,power_law_1.2,25.143775939941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,power_law_1.01,0.06183040142059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,balanced,0.11440533399581909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,power_law_1.01,0.08429440259933471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,balanced,0.7842240333557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,balanced,0.12444800138473511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,power_law_1.01,0.11183359622955322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,balanced,0.03148799886306127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,balanced,0.14015466968218485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,power_law_1.01,0.11729279756546021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,power_law_1.01,0.03805440068244934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,1,power_law_1.2,49.93368835449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,balanced,0.03311466674009959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,power_law_1.01,0.11640959978103638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,balanced,0.03584533433119456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,balanced,0.15527466932932535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,power_law_1.01,0.036396801471710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,power_law_1.01,0.12312320470809937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,balanced,0.05574400226275126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,power_law_1.01,0.04163840115070343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,balanced,0.07891199986139934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,power_law_1.01,0.12339839935302735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,balanced,0.20222934087117514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,balanced,0.0814933329820633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,power_law_1.01,0.05272960066795349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,power_law_1.01,0.12559360265731812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,balanced,0.08239999910195668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,power_law_1.01,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,balanced,0.08252800007661183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,power_law_1.01,0.13006080389022828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,balanced,0.0832533339659373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,balanced,0.2322346568107605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,power_law_1.01,0.07655680179595947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,balanced,0.9751733144124349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,power_law_1.01,0.13086719512939454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,balanced,0.08549333612124126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,power_law_1.01,0.08087679743766785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,balanced,0.08649067083994548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,power_law_1.01,0.1376960039138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,balanced,0.08794132868448894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,power_law_1.01,0.08223999738693237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,power_law_1.01,0.14718079566955566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,balanced,0.3230773409207662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,balanced,0.08950400352478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,power_law_1.01,0.08190079927444457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,power_law_1.01,0.15311360359191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,power_law_1.01,0.08440319895744323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,balanced,0.09238400061925252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,power_law_1.01,0.1557055950164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,power_law_1.01,0.08807039856910706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,power_law_1.01,0.08894079923629761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,power_law_1.01,0.16490880250930787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,power_law_1.01,0.09181439876556396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,power_law_1.01,0.1792512059211731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,balanced,0.4035573403040568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,power_law_1.01,0.09382399916648865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,power_law_1.01,0.20627200603485107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,power_law_1.01,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,balanced,0.10044266780217488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,power_law_1.01,0.23596160411834716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,power_law_1.01,0.10444799661636353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,balanced,0.10203199585278828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,power_law_1.01,0.2860415935516357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,power_law_1.01,0.1106112003326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,power_law_1.01,0.31553919315338136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,power_law_1.01,0.12947200536727904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,power_law_1.01,0.03529599905014038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,power_law_1.01,0.43158397674560545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,power_law_1.01,0.13740160465240478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,power_law_1.01,0.5855231761932373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,power_law_1.01,0.03468799889087677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,power_law_1.01,0.16275839805603026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,balanced,0.5785066684087118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,balanced,1.4926667213439941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,power_law_1.01,0.7492159843444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,power_law_1.01,0.03928320109844208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,power_law_1.01,0.1915071964263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,power_law_1.01,0.9956928253173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,power_law_1.01,0.05135359764099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,power_law_1.01,0.2470400094985962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,power_law_1.01,1.3438719749450683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,balanced,0.11098666985829671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,power_law_1.01,0.058950400352478026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,power_law_1.01,0.2856703996658325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,power_law_1.01,0.07712000012397766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,power_law_1.01,2.226655960083008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,balanced,0.12530666589736938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,power_law_1.01,0.4169407844543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,power_law_1.01,0.08012160062789916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,power_law_1.01,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,balanced,0.13421333829561868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,power_law_1.01,3.984729766845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,power_law_1.01,0.701862382888794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,power_law_1.01,0.08034560084342957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,balanced,0.16802134116490683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,balanced,0.7584693431854248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,power_law_1.01,0.08405759930610657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,power_law_1.01,1.0044992446899415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,4,power_law_1.2,0.050310397148132326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,power_law_1.01,0.08471680283546448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,power_law_1.01,1.1675519943237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,balanced,0.1865546703338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,4,power_law_1.2,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,power_law_1.01,0.08782079815864563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,power_law_1.01,1.949465560913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,power_law_1.01,0.09238399863243103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,4,power_law_1.2,0.0453247994184494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,balanced,0.27431466182072956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,power_law_1.01,0.09448959827423095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,4,power_law_1.2,0.05612800121307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,power_law_1.01,3.951366424560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,power_law_1.01,0.10525439977645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,4,power_law_1.2,0.0725055992603302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,balanced,0.33643198013305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,4,power_law_1.2,0.11106560230255128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,4,power_law_1.2,0.11452800035476685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,power_law_1.01,0.11036159992218017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,balanced,0.9392480055491129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,4,power_law_1.2,0.12286080121994018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,power_law_1.01,0.1155135989189148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,balanced,0.49088533719380695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,4,power_law_1.2,0.12350080013275147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,4,power_law_1.2,0.12789759635925294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,power_law_1.01,0.12071679830551148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,4,power_law_1.2,0.13171199560165406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,power_law_1.01,0.13656959533691407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,balanced,0.6397973299026489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,4,power_law_1.2,0.13322880268096923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,power_law_1.01,0.1610751986503601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,4,power_law_1.2,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,power_law_1.01,0.19976320266723632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,4,power_law_1.2,0.131660795211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,power_law_1.01,0.28044800758361815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,4,power_law_1.2,0.14929920434951782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,power_law_1.01,0.3646719932556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,balanced,2.764373461405436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,4,power_law_1.2,0.16353919506072997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,balanced,0.9351253509521484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,power_law_1.01,0.48699522018432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,4,power_law_1.2,0.15835520029067993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,power_law_1.01,0.6429440021514893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,4,power_law_1.2,0.17415039539337157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,balanced,1.4579946200052898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,4,power_law_1.2,0.1875391960144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,power_law_1.01,0.8854656219482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,4,power_law_1.2,0.22005119323730468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,power_law_1.01,1.2000831604003905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,4,power_law_1.2,0.2573951959609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,power_law_1.01,1.636524772644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,4,power_law_1.2,0.3230720043182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,balanced,1.2263092994689941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,power_law_1.01,2.2075008392333983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,4,power_law_1.2,0.35431039333343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,power_law_1.01,3.3249279022216798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,4,power_law_1.2,0.4891712188720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,4,power_law_1.2,0.685868787765503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,power_law_1.01,6.878144073486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,4,power_law_1.2,0.8118847846984864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,4,power_law_1.2,1.2280447959899903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,4,power_law_1.2,1.6059711456298829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,balanced,1.519594669342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,4,power_law_1.2,2.437625694274902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,4,power_law_1.2,5.9448894500732425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,balanced,2.802501360575358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,4,power_law_1.2,0.037503999471664426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,balanced,2.3960960706075034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,4,power_law_1.2,0.03544319868087768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,4,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,4,power_law_1.2,0.05118719935417175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,4,power_law_1.2,0.05898879766464234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,4,power_law_1.2,0.07712640166282654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,4,power_law_1.2,0.08162559866905213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,4,power_law_1.2,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,4,power_law_1.2,0.08201599717140198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,4,power_law_1.2,0.08540800213813782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,4,power_law_1.2,0.08790400028228759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,4,power_law_1.2,0.08778240084648133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,4,power_law_1.2,0.0953984022140503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,4,power_law_1.2,0.09700480103492737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,4,power_law_1.2,0.10303360223770142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,4,power_law_1.2,0.11080319881439209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,4,power_law_1.2,0.11643520593643189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,4,power_law_1.2,0.13052159547805786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,4,power_law_1.2,0.14407680034637452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,4,power_law_1.2,0.17825920581817628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,4,power_law_1.2,0.21089279651641846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,4,power_law_1.2,0.26445438861846926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,4,power_law_1.2,0.28015999794006347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,4,power_law_1.2,0.43966078758239746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,4,power_law_1.2,0.5506303787231446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,balanced,4.759039878845215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,4,power_law_1.2,0.8523520469665528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,4,power_law_1.2,1.0839167594909669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,4,power_law_1.2,1.3334079742431642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,balanced,0.028197333216667175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,4,power_law_1.2,2.2589439392089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,balanced,0.03279466678698858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,balanced,0.04877866804599762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,4,power_law_1.2,0.034835198521614076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,4,power_law_1.2,5.300979232788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,balanced,0.07732800145943959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,4,power_law_1.2,0.03531520068645477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,balanced,0.1264693339665731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,4,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,balanced,0.1265120009581248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,4,power_law_1.2,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,balanced,0.12710932890574136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,4,power_law_1.2,0.053523200750350955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,balanced,0.1288426617781321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,4,power_law_1.2,0.07745280265808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,balanced,0.12935466567675272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,4,power_law_1.2,0.07928959727287292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,balanced,0.12916800379753113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,4,power_law_1.2,0.0809664011001587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,balanced,0.13140267133712769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,4,power_law_1.2,0.08483200073242188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,balanced,0.13379200299580893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,balanced,0.033786666889985405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,4,power_law_1.2,0.08663679957389832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,balanced,0.13526399930318198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,balanced,0.03393599887688955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,4,power_law_1.2,0.09115520119667053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,balanced,0.1369493305683136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,balanced,0.03788266579310099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,4,power_law_1.2,0.09416319727897644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,balanced,0.060453335444132485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,balanced,0.1455519994099935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,4,power_law_1.2,0.09758719801902771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,balanced,0.08531733353932698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,4,power_law_1.2,0.10440319776535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,balanced,0.14844800035158792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,balanced,0.08675199747085571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,balanced,0.15862933794657388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,balanced,0.0879253347714742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,balanced,0.17005866765975952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,4,power_law_1.2,0.11292159557342529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,balanced,0.088128000497818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,4,power_law_1.2,0.11396479606628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,balanced,0.18386133511861166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,balanced,0.08996267120043437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,balanced,0.09045867125193278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,balanced,0.20227199792861938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,balanced,0.09219200412432353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,balanced,0.09425600369771321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,4,power_law_1.2,0.1292672038078308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,balanced,0.0953653355439504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,balanced,0.22032000621159872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,4,power_law_1.2,0.1497215986251831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,balanced,0.09938133756319682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,4,power_law_1.2,0.1721791982650757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,balanced,0.1058026651541392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,balanced,0.27642132838567096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,4,power_law_1.2,0.20246400833129882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,balanced,0.10802132884661357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,4,power_law_1.2,0.2769599914550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,balanced,0.11762666702270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,balanced,0.32441065708796185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,4,power_law_1.2,0.3679935932159424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,balanced,0.13061333696047464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,4,power_law_1.2,0.5150335788726806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,balanced,0.14283733566602072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,4,power_law_1.2,0.6896704196929931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,balanced,0.4607626597086589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,4,power_law_1.2,0.9931008338928222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,balanced,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,balanced,0.16850133736928305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,balanced,0.04180799921353658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,4,power_law_1.2,1.5911359786987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,power_law_1.01,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,balanced,0.045797333121299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,balanced,0.18729066848754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,4,power_law_1.2,1.7885631561279296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,balanced,0.06229866544405619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,balanced,0.08710400263468425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,power_law_1.01,0.04232960045337677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,4,power_law_1.2,2.311782455444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,balanced,0.5671039819717407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,balanced,0.08896000186602275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,balanced,0.25303467114766437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,power_law_1.01,0.05882880091667175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,balanced,0.09150933225949605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,balanced,0.09199999769528706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,4,power_law_1.2,4.25030403137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,power_law_1.01,0.07434880137443542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,balanced,0.09333333373069763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,power_law_1.01,0.11199359893798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,balanced,0.3006613254547119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,balanced,0.09496532877286275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,4,power_law_1.2,7.536921691894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,power_law_1.01,0.11313920021057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,balanced,0.09851732850074768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,power_law_1.01,0.11894400119781494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,balanced,0.10034132997194926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,balanced,0.10408533612887065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,power_law_1.01,0.12390400171279907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,balanced,0.8157066504160563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,balanced,0.4370933373769124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,balanced,0.10872532924016316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,power_law_1.01,0.03461759984493255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,power_law_1.01,0.12503679990768432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,power_law_1.01,0.12688640356063843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,power_law_1.01,0.03298560082912445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,power_law_1.01,0.13497600555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,power_law_1.01,0.03824000060558319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,balanced,0.585482676823934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,balanced,0.12065600355466206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,power_law_1.01,0.05221760272979736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,power_law_1.01,0.13835519552230835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,power_law_1.01,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,balanced,0.12204266587893169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,power_law_1.01,0.1417407989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,power_law_1.01,0.07959679961204529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,power_law_1.01,0.14896639585494995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,balanced,1.068837324778239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,power_law_1.01,0.0801472008228302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,power_law_1.01,0.15134079456329347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,power_law_1.01,0.08513919711112976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,power_law_1.01,0.1615679979324341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,power_law_1.01,0.08572800159454345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,balanced,0.856607993443807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,power_law_1.01,0.1794111967086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,power_law_1.01,0.08748800158500672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,balanced,0.140474667151769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,power_law_1.01,0.09321600198745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,power_law_1.01,0.19299839735031127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,power_law_1.01,0.09468799829483032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,balanced,0.16446399688720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,power_law_1.01,0.22737278938293456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,power_law_1.01,0.09937919974327088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,balanced,0.17460266749064127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,power_law_1.01,0.10113919973373413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,power_law_1.01,0.27171199321746825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,power_law_1.01,0.11281919479370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,balanced,0.23695999383926392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,balanced,1.3207200368245442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,power_law_1.01,0.34294400215148924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,power_law_1.01,0.11431039571762085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,balanced,1.1302186648050945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,balanced,0.287663996219635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,power_law_1.01,0.12398079633712769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,power_law_1.01,0.37090559005737306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,power_law_1.01,0.1423616051673889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,power_law_1.01,0.15384960174560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,balanced,0.41999467213948566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,power_law_1.01,0.4809088230133057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,power_law_1.01,0.18545279502868653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,power_law_1.01,0.21914238929748536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,power_law_1.01,0.29971840381622317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,power_law_1.01,0.6578112125396729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,balanced,0.5039519866307577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,power_law_1.01,0.343724799156189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,power_law_1.01,0.8982784271240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,power_law_1.01,0.5007423877716064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,power_law_1.01,1.20698881149292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,power_law_1.01,0.5971968173980713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,balanced,1.4073707262674968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,power_law_1.01,1.4636351585388183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,balanced,0.7457013130187988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,power_law_1.01,0.9059583663940429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,power_law_1.01,2.3049856185913087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,power_law_1.01,1.1650176048278809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,power_law_1.01,1.5319487571716308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,power_law_1.01,4.678764724731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,power_law_1.01,2.4096960067749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,balanced,0.985584020614624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,balanced,2.0758132934570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,power_law_1.01,5.061171340942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,power_law_1.01,0.039263999462127684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,power_law_1.01,0.04371840059757233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,balanced,1.4537067413330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,power_law_1.01,0.0465472012758255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,power_law_1.01,0.05501440167427063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,power_law_1.01,0.06232960224151611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,2,power_law_1.2,0.03440000116825104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,balanced,2.2307519912719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,power_law_1.01,0.08313599824905396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,2,power_law_1.2,0.03296639919281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,power_law_1.01,0.08478080034255982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,2,power_law_1.2,0.039827200770378116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,2,power_law_1.2,0.05716480016708374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,power_law_1.01,0.08750720024108886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,balanced,1.9101440111796062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,2,power_law_1.2,0.06967679858207702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,power_law_1.01,0.09144319891929627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,2,power_law_1.2,0.11074559688568116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,power_law_1.01,0.09452160000801087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,2,power_law_1.2,0.11424000263214111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,power_law_1.01,0.09960319995880126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,2,power_law_1.2,0.12264319658279418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,power_law_1.01,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,2,power_law_1.2,0.12515840530395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,power_law_1.01,0.10797439813613892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,power_law_1.01,0.1184000015258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,2,power_law_1.2,0.12697600126266478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,2,power_law_1.2,0.1322175979614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,2,power_law_1.2,0.13596160411834718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,balanced,2.376592000325521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,power_law_1.01,0.1261952042579651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,2,power_law_1.2,0.13634560108184815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,2,power_law_1.2,0.14641280174255372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,power_law_1.01,0.13896960020065308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,2,power_law_1.2,0.15160319805145264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,2,power_law_1.2,0.15752320289611815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,2,power_law_1.2,0.1636288046836853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,power_law_1.01,0.1449280023574829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,2,power_law_1.2,0.1810495972633362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,balanced,4.0808000564575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,power_law_1.01,0.17632639408111572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,2,power_law_1.2,0.2015552043914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,power_law_1.01,0.2013375997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,2,power_law_1.2,0.2291264057159424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,power_law_1.01,0.2776128053665161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,2,power_law_1.2,0.296345591545105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,power_law_1.01,0.3341439962387085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,2,power_law_1.2,0.3617664098739624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,2,power_law_1.2,0.3948800086975098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,power_law_1.01,0.4825984001159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,2,power_law_1.2,0.492307186126709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,power_law_1.01,0.6009471893310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,balanced,3.7415574391682944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,balanced,4.208703994750977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,power_law_1.01,0.9062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,2,power_law_1.2,0.7364160060882569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,power_law_1.01,1.0483263969421386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,2,power_law_1.2,0.9286335945129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,power_law_1.01,1.6587135314941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,2,power_law_1.2,1.3060799598693849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,power_law_1.01,2.3709695816040037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,2,power_law_1.2,1.6202816009521483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,power_law_1.01,2.6260351181030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,2,power_law_1.2,2.300934410095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,power_law_1.01,4.224499130249024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,2,power_law_1.2,4.79675521850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,2,power_law_1.2,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,power_law_1.01,8.89416961669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,2,power_law_1.2,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,2,power_law_1.2,0.03999359905719757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,2,power_law_1.2,0.04656000137329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,2,power_law_1.2,0.05690240263938904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,2,power_law_1.2,0.08073599934577942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,2,power_law_1.2,0.08058879971504211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,2,power_law_1.2,0.08538240194320679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,2,power_law_1.2,0.08737919926643371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,2,power_law_1.2,0.08882560133934021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,2,power_law_1.2,0.09205120205879211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,2,power_law_1.2,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,2,power_law_1.2,0.10062079429626465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,2,power_law_1.2,0.10398720502853394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,2,power_law_1.2,0.11005439758300781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,2,power_law_1.2,0.11615359783172607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,2,power_law_1.2,0.12648320198059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,2,power_law_1.2,0.14127999544143677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,2,power_law_1.2,0.16224000453948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,2,power_law_1.2,0.18643200397491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,balanced,7.400805155436198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,2,power_law_1.2,0.2309823989868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,2,power_law_1.2,0.29153919219970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,2,power_law_1.2,0.3737407922744751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,2,power_law_1.2,0.4994815826416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,2,power_law_1.2,0.6751872062683105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,2,power_law_1.2,1.016096019744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,2,power_law_1.2,1.3059391975402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,2,power_law_1.2,1.5900608062744142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,2,power_law_1.2,2.5728960037231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,2,power_law_1.2,6.147609710693359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,balanced,0.030389333764712017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,balanced,0.035445332527160645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,balanced,0.05126399795214335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,2,power_law_1.2,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,balanced,0.07951466739177704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,balanced,0.13115732868512472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,2,power_law_1.2,0.04439679980278015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,balanced,0.13108266393343607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,2,power_law_1.2,0.04519680142402649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,balanced,0.1311199963092804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,2,power_law_1.2,0.05395200252532959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,balanced,0.13269866506258646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,2,power_law_1.2,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,balanced,0.13378133376439413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,2,power_law_1.2,0.0830847978591919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,balanced,0.1341493328412374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,2,power_law_1.2,0.08650239706039428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,balanced,0.13596266508102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,2,power_law_1.2,0.08835840225219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,balanced,0.13943466544151306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,2,power_law_1.2,0.09523839950561523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,balanced,0.14255999525388083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,2,power_law_1.2,0.0958079993724823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,balanced,0.14550399780273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,2,power_law_1.2,0.10225919485092164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,balanced,0.15678399801254272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,2,power_law_1.2,0.10677119493484497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,2,power_law_1.2,0.11089919805526734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,balanced,0.1616106629371643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,2,power_law_1.2,0.12167680263519287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,balanced,0.1774079998334249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,balanced,0.20225600401560465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,2,power_law_1.2,0.13051520586013793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,balanced,0.21562665700912476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,2,power_law_1.2,0.13850239515304566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,balanced,0.2500800093015035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,2,power_law_1.2,0.15194239616394042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,balanced,0.26337599754333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,2,power_law_1.2,0.17847039699554443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,2,power_law_1.2,0.20177919864654542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,balanced,0.37830400466918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,2,power_law_1.2,0.27631359100341796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,2,power_law_1.2,0.3673727989196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,balanced,0.42182401816050213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,2,power_law_1.2,0.45632638931274416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,2,power_law_1.2,0.6011712074279785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,2,power_law_1.2,0.932198429107666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,2,power_law_1.2,1.2185983657836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,balanced,0.65720534324646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,2,power_law_1.2,1.7637567520141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,balanced,0.03745600084463755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,balanced,0.03751466671625773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,2,power_law_1.2,2.191334342956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,balanced,0.043466667334238686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,balanced,0.06621333460013072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,2,power_law_1.2,2.8280832290649416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,balanced,0.8807893594106039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,balanced,0.0949173370997111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,balanced,0.09624000390370686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,2,power_law_1.2,4.470111846923828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,balanced,0.0971999963124593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,balanced,0.09749866525332133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,2,power_law_1.2,8.638285064697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,balanced,0.09987200299898784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,balanced,0.10126933455467224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,balanced,0.1037600040435791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,balanced,0.10786666472752889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,balanced,1.3338559468587239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,balanced,0.11116266250610352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,balanced,0.11672533551851909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,balanced,0.1251306633154551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,balanced,0.13153599699338278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,balanced,0.06128533184528351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,balanced,0.14924266934394836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,balanced,0.06504000226656596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,balanced,0.1732106606165568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,balanced,0.06753066678841908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,balanced,0.08214400211970012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,balanced,0.1890666683514913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,power_law_1.01,0.03544960021972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,balanced,1.7476800282796223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,balanced,0.10914132992426555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,power_law_1.01,0.029631999135017396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,balanced,0.23197867472966513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,power_law_1.01,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,balanced,0.11370133360226949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,power_law_1.01,0.0351936012506485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,power_law_1.01,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,balanced,0.11453333497047424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,balanced,0.2690826654434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,balanced,0.11731200416882832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,power_law_1.01,0.05356799960136414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,power_law_1.01,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,balanced,0.12082133690516154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,power_law_1.01,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,power_law_1.01,0.05766400098800659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,balanced,0.12363732854525249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,balanced,0.38885335127512616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,power_law_1.01,0.08526719808578491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,power_law_1.01,0.07352960109710693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,balanced,0.12666666507720947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,power_law_1.01,0.08915200233459472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,power_law_1.01,0.11487360000610351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,balanced,0.13503467043240866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,power_law_1.01,0.09137920141220093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,balanced,0.47470398743947345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,balanced,0.13928533593813577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,power_law_1.01,0.11715840101242066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,power_law_1.01,0.09591040015220642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,balanced,2.1938986778259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,balanced,0.1448906660079956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,power_law_1.01,0.1223680019378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,power_law_1.01,0.098854398727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,power_law_1.01,0.12961280345916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,power_law_1.01,0.10592639446258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,balanced,0.6831200122833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,power_law_1.01,0.1300160050392151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,power_law_1.01,0.11331839561462402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,power_law_1.01,0.11759999990463257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,power_law_1.01,0.13728640079498292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,balanced,0.1654933293660482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,power_law_1.01,0.12225279808044434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,power_law_1.01,0.143231999874115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,balanced,0.1696000099182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,power_law_1.01,0.130239999294281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,power_law_1.01,0.14816639423370362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,balanced,0.934613307317098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,power_law_1.01,0.14188799858093262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,power_law_1.01,0.15441279411315917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,power_law_1.01,0.15530879497528077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,power_law_1.01,0.052883201837539674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,power_law_1.01,0.16088320016860963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,power_law_1.01,0.18511999845504762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,power_law_1.01,0.06206079721450806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,power_law_1.01,0.20122239589691163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,power_law_1.01,0.17621760368347167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,power_law_1.01,0.06528000235557556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,balanced,0.20083733399709067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,power_law_1.01,0.07242879867553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,power_law_1.01,0.25287680625915526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,power_law_1.01,0.19051519632339478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,power_law_1.01,0.082150399684906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,balanced,0.2505279978116353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,balanced,1.4597439765930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,power_law_1.01,0.30268158912658694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,power_law_1.01,0.21771519184112548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,power_law_1.01,0.1013375997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,balanced,3.506453196207682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,power_law_1.01,0.1045632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,power_law_1.01,0.40494718551635744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,balanced,0.2869973381360372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.2277888059616089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,power_law_1.01,0.10959359407424926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,power_law_1.01,0.5029248237609864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.2706559896469116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,power_law_1.01,0.11556479930877686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,balanced,0.40305598576863605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,power_law_1.01,0.7111040115356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,power_law_1.01,0.1200063943862915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.29870080947875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,power_law_1.01,0.12572799921035765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,power_law_1.01,0.932703971862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,power_law_1.01,0.39441280364990233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,power_law_1.01,0.13675520420074463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,balanced,0.4739840030670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,power_law_1.01,0.1434623956680298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,power_law_1.01,1.382265567779541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,power_law_1.01,0.4725503921508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,power_law_1.01,0.1591104030609131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,power_law_1.01,0.6607999801635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,power_law_1.01,1.8471359252929687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,balanced,1.9440053304036458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,1,power_law_1.2,0.029651200771331786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,power_law_1.01,0.8501119613647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,power_law_1.01,2.3202688217163088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,balanced,0.7095093727111816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,1,power_law_1.2,0.03544319868087768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,power_law_1.01,0.17375359535217286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,power_law_1.01,1.2370431900024415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,1,power_law_1.2,0.04147199988365173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,power_law_1.01,3.7235649108886717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,power_law_1.01,0.185971200466156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,power_law_1.01,1.6401344299316407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,1,power_law_1.2,0.05373439788818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,balanced,0.8701013724009196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,1,power_law_1.2,0.06846079826354981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,power_law_1.01,2.051590347290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,power_law_1.01,7.50140151977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,1,power_law_1.2,0.11527680158615113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,power_law_1.01,0.2025536060333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,1,power_law_1.2,0.12015360593795776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,power_law_1.01,3.2839935302734373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,1,power_law_1.2,0.12409600019454955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,power_law_1.01,0.25340800285339354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,balanced,1.2881866296132405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,1,power_law_1.2,0.12979840040206908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,power_law_1.01,0.3095360040664673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,power_law_1.01,6.854208374023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,1,power_law_1.2,0.13563519716262817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,balanced,2.421482721964518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,power_law_1.01,0.4177855968475342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,1,power_law_1.2,0.1368064045906067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,power_law_1.01,0.5134016036987304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,1,power_law_1.2,0.14583040475845338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,power_law_1.01,0.703443193435669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,1,power_law_1.2,0.14812159538269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,balanced,1.6974986394246419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,power_law_1.01,0.898521614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,1,power_law_1.2,0.15323519706726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,1,power_law_1.2,0.1639680027961731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,power_law_1.01,1.3073535919189454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,1,power_law_1.2,0.17500799894332886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,power_law_1.01,1.715225601196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,1,power_law_1.2,0.19041919708251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,power_law_1.01,2.515891265869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,1,power_law_1.2,0.2218048095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,power_law_1.01,3.320364761352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,balanced,2.5048160552978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.23023359775543212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.2724992036819458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,power_law_1.01,4.131545639038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,balanced,6.522698720296224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.303769588470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,1,power_law_1.2,0.39930880069732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,power_law_1.01,6.536345672607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,1,power_law_1.2,0.4723519802093506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,1,power_law_1.2,0.6650176048278809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,balanced,3.8592373530069985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,power_law_1.01,12.913888549804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,1,power_law_1.2,0.8591360092163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,1,power_law_1.2,1.2633472442626954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,balanced,3.322506586710612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,1,power_law_1.2,1.6663040161132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,1,power_law_1.2,2.082124710083008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,1,power_law_1.2,3.330873489379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,1,power_law_1.2,6.941395568847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,balanced,4.12938117980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,1,power_law_1.2,0.0352512001991272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,1,power_law_1.2,0.035359999537467955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,1,power_law_1.2,0.03940480053424835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,1,power_law_1.2,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,1,power_law_1.2,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,1,power_law_1.2,0.08604159951210022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,1,power_law_1.2,0.08999680280685425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,1,power_law_1.2,0.09597439765930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,balanced,6.532490412394206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,1,power_law_1.2,0.0985152006149292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,balanced,7.30406379699707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,1,power_law_1.2,0.10389120578765869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,1,power_law_1.2,0.10860799551010132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,1,power_law_1.2,0.11484160423278808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,1,power_law_1.2,0.12295680046081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,1,power_law_1.2,0.12409600019454955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,1,power_law_1.2,0.13299839496612548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,1,power_law_1.2,0.14514559507369995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,1,power_law_1.2,0.1583359956741333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,1,power_law_1.2,0.18889600038528442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,1,power_law_1.2,0.2050112009048462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,1,power_law_1.2,0.25534720420837403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,1,power_law_1.2,0.30215680599212646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,1,power_law_1.2,0.4042304039001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,1,power_law_1.2,0.5071296215057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,1,power_law_1.2,0.7147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,1,power_law_1.2,0.9355456352233886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,1,power_law_1.2,1.4037311553955079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,1,power_law_1.2,1.875040054321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,1,power_law_1.2,2.333625602722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,1,power_law_1.2,3.7482177734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,1,power_law_1.2,7.575539398193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,balanced,12.9476318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,balanced,0.058506667613983154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,balanced,0.07472533484299977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,balanced,0.12417599558830261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,1,power_law_1.2,0.05562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,balanced,0.22550400098164877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,balanced,0.415338675181071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,1,power_law_1.2,0.06250240206718445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,balanced,0.41743465264638263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,1,power_law_1.2,0.06573439836502075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,balanced,0.41923733552296955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,1,power_law_1.2,0.07207679748535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,balanced,0.41699198881785077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,balanced,0.4190080165863037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,1,power_law_1.2,0.07958400249481201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,balanced,0.42026666800181073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,1,power_law_1.2,0.10073599815368653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,balanced,0.42244799931844074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,1,power_law_1.2,0.10631680488586426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,balanced,0.4242560068766276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,balanced,0.42583998044331867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,1,power_law_1.2,0.11246720552444459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,balanced,0.04101866732041041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,balanced,0.43131200472513836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,1,power_law_1.2,0.11771520376205444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,balanced,0.05585066477457682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,balanced,0.4476426839828491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,1,power_law_1.2,0.12171519994735717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,balanced,0.08100800216197968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,balanced,0.13239999612172446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,balanced,0.45445867379506427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,1,power_law_1.2,0.1282688021659851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,balanced,0.2277173399925232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,1,power_law_1.2,0.13853440284729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,balanced,0.46186665693918866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,balanced,0.232314666112264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,balanced,0.2338026762008667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,1,power_law_1.2,0.14465919733047486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,balanced,0.2342453400293986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,balanced,0.47667733828226727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,balanced,0.234607994556427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,1,power_law_1.2,0.1603008031845093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,balanced,0.5030080080032349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,balanced,0.23701866467793783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,balanced,0.2395626703898112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,balanced,0.5278186798095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,balanced,0.040976000328858696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,balanced,0.24241065979003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.01,0.1270143985748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,1,power_law_1.2,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,balanced,0.24541866779327393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,balanced,0.05383466680844625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,1,power_law_1.2,0.18867839574813844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,balanced,0.5502933263778687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.01,0.09836800098419189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,balanced,0.24894932905832926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,balanced,0.07798933486143748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,balanced,0.2560853362083435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.01,0.1350335955619812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,balanced,0.25972266991933185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,balanced,0.1292586624622345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,balanced,0.6381386518478394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.01,0.17651840448379516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,1,power_law_1.2,0.2012864112854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,balanced,0.26665600140889484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,balanced,0.2236106594403585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.01,0.24407680034637452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,1,power_law_1.2,0.25437440872192385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,balanced,0.28177066644032794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,balanced,0.22670932610829672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,balanced,0.7013653119405111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,1,power_law_1.2,0.31030399799346925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.01,0.3595263957977295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,balanced,0.2299626668294271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,balanced,0.29870933294296265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,balanced,0.23076266050338745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,1,power_law_1.2,0.4209472179412842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.01,0.37730560302734373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,balanced,0.32530667384465534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,balanced,0.23276267449061075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,1,power_law_1.2,0.5147647857666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.01,0.3848639965057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,balanced,0.23548267285029092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,balanced,0.9069120089213053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,balanced,0.35546668370564777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,1,power_law_1.2,0.7093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.01,0.39174399375915525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,balanced,0.23876800139745077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,1,power_law_1.2,0.9066176414489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,balanced,0.24213866392771402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.01,0.39139840602874754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,balanced,0.4373013178507487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,balanced,0.24754667282104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,1,power_law_1.2,1.312070369720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.01,0.39697918891906736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,balanced,0.25353066126505536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.01,0.4153855800628662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,1,power_law_1.2,1.7247232437133788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,balanced,1.181440035502116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,balanced,0.49531201521555585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.01,0.41283202171325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,1,power_law_1.2,2.5323392868041994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.01,0.45393919944763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,1,power_law_1.2,3.3364864349365235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,balanced,0.6520959933598837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.01,0.4784575939178467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,balanced,0.26390933990478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,1,power_law_1.2,4.137459182739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.01,0.46625919342041017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,balanced,0.2693600058555603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.01,0.4936255931854248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.01,0.07916799783706666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,balanced,1.6669386227925618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,1,power_law_1.2,6.541222381591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.01,0.5527488231658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.01,0.07443199753761291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,balanced,0.8205333550771078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.01,0.07571200132369996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.01,0.515993595123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.01,0.10805759429931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,1,power_law_1.2,12.915359497070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.01,0.5895232200622559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.01,0.13303680419921876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.01,0.6721407890319824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.01,0.20275840759277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.01,0.8326144218444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.01,0.21711359024047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.01,0.21783039569854737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.01,0.9651583671569824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.01,0.22137598991394042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.01,0.22653439044952392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.01,1.3564031600952149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,balanced,1.1804906527201335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,balanced,0.28651734193166095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,balanced,2.1958559354146323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.01,0.2336064100265503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.01,1.6383295059204102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,balanced,0.3131999969482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.01,0.244704008102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.01,0.24855680465698243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.01,2.4883712768554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,balanced,0.33102933565775555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.01,0.24340479373931884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.01,0.2620543956756592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.01,3.2948543548583986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,balanced,0.39587199687957764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.01,0.26319360733032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.01,0.26956160068511964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.01,3.763417434692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,balanced,0.45051733652750653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.01,0.3201600074768066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,balanced,1.5206507047017415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.01,0.3396735906600952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.01,5.131737518310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.01,0.3934272050857544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,balanced,0.6451733509699503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.01,0.437286376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,balanced,2.716005325317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.01,12.102886199951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.01,0.5164224147796631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.01,0.6496319770812988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,balanced,0.7524693012237549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.01,0.8811327934265136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.01,1.0892736434936523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.01,1.6760704040527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,balanced,1.0863146781921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.01,2.1755903244018553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.01,2.768550491333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,balanced,1.9388586680094402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.12522879838943482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.01,4.188057708740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.1107200026512146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,balanced,1.4299306869506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,power_law_1.01,0.08153600096702576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,4,power_law_1.2,0.14991359710693358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.01,8.251634979248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,4,power_law_1.2,0.20853118896484374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,power_law_1.01,0.07006719708442688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,power_law_1.01,0.07122560143470764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,4,power_law_1.2,0.36963839530944825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,power_law_1.01,0.10454399585723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,4,power_law_1.2,0.39571199417114256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,power_law_1.01,0.13860479593276978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,balanced,4.186613400777181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,4,power_law_1.2,0.38775680065155027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,power_law_1.01,0.20001280307769775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,balanced,2.10972261428833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,4,power_law_1.2,0.4100543975830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,power_law_1.01,0.21203200817108153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,4,power_law_1.2,0.42622079849243166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,power_law_1.01,0.21522560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,4,power_law_1.2,0.4354368209838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,power_law_1.01,0.23327360153198243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,power_law_1.01,0.23069438934326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,4,power_law_1.2,0.4397183895111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,power_law_1.01,0.24622719287872313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,4,power_law_1.2,0.44700798988342283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,power_law_1.01,0.25960960388183596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,balanced,3.0446348190307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,4,power_law_1.2,0.46558079719543455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,power_law_1.01,0.2778048038482666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,4,power_law_1.2,0.4884799957275391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,power_law_1.01,0.28603520393371584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,balanced,2.8181333541870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,4,power_law_1.2,0.523737621307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,4,power_law_1.2,0.5110400199890137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,4,power_law_1.2,0.5803775787353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,power_law_1.01,0.29247360229492186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,4,power_law_1.2,0.5624447822570801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,power_law_1.01,0.30144639015197755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,4,power_law_1.2,0.63854079246521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,4,power_law_1.2,0.7146368026733398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,4,power_law_1.2,0.939084815979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,power_law_1.01,0.3100287914276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,4,power_law_1.2,1.131488037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,power_law_1.01,0.372761607170105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,4,power_law_1.2,1.4613375663757324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.01,0.4170368194580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,4,power_law_1.2,1.9292352676391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.01,0.5118015766143799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,balanced,3.5137599309285483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,4,power_law_1.2,2.8025791168212892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.01,0.6117568016052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.01,0.8496064186096192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,4,power_law_1.2,3.4852672576904298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.01,1.098367977142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,4,power_law_1.2,4.036627197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.01,1.6437055587768554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,4,power_law_1.2,7.4409538269042965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.01,1.779372787475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.01,3.2248256683349608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.01,3.8923648834228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,power_law_1.2,14.055661010742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,4,balanced,8.13259188334147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,power_law_1.01,5.019692611694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,power_law_1.01,8.407673645019532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,power_law_1.01,17.342495727539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,balanced,5.650762557983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,balanced,6.057130813598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,4,power_law_1.2,0.07831040024757385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,4,power_law_1.2,0.05299199819564819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,4,power_law_1.2,0.07662720084190369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,4,power_law_1.2,0.10963200330734253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,4,power_law_1.2,0.11953279972076417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,4,power_law_1.2,0.20874240398406982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,4,power_law_1.2,0.20510718822479249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,4,power_law_1.2,0.22187519073486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,4,power_law_1.2,0.22529280185699463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,4,power_law_1.2,0.23569920063018798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,4,power_law_1.2,0.23995521068572997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,balanced,11.284074147542318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,4,power_law_1.2,0.2505408048629761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,4,power_law_1.2,0.2422271966934204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,4,power_law_1.2,0.2546112060546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,4,power_law_1.2,0.2650943994522095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,4,power_law_1.2,0.08117120265960694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,4,power_law_1.2,0.2862400054931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,4,power_law_1.2,0.05845119953155518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,4,power_law_1.2,0.28190720081329346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,4,power_law_1.2,0.07774080038070678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,4,power_law_1.2,0.3197887897491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,4,power_law_1.2,0.09400960206985473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,4,power_law_1.2,0.33724160194396974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,4,power_law_1.2,0.1265663981437683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,4,power_law_1.2,0.1970752000808716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,4,power_law_1.2,0.4297023773193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,4,power_law_1.2,0.20959999561309814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,4,power_law_1.2,0.4689151763916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,4,power_law_1.2,0.22305281162261964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,4,power_law_1.2,0.5844927787780761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,balanced,0.0580320010582606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,4,power_law_1.2,0.22222719192504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,4,power_law_1.2,0.7121600151062012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,balanced,0.07524266839027405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,4,power_law_1.2,0.23519999980926515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,balanced,0.12520000338554382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,4,power_law_1.2,0.9678144454956055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,4,power_law_1.2,0.24790399074554442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,balanced,0.22517865896224976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,balanced,0.41627200444539386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,4,power_law_1.2,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,4,power_law_1.2,1.155846405029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,balanced,0.42236800988515216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,4,power_law_1.2,0.2751296043395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,4,power_law_1.2,1.7981632232666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,balanced,0.4243946472803752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,balanced,0.42349334557851154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,4,power_law_1.2,0.2876352071762085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,4,power_law_1.2,2.3371135711669924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,balanced,0.42455466588338214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,balanced,0.42605865001678467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,4,power_law_1.2,3.2605312347412108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,balanced,0.4287946621576945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,4,power_law_1.2,0.29827840328216554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,balanced,0.4344746669133504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,balanced,0.4354879856109619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,4,power_law_1.2,0.31318399906158445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,4,power_law_1.2,5.536294555664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,balanced,0.44115734100341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,balanced,0.4574720064798991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,4,power_law_1.2,0.34250240325927733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,balanced,0.4634079933166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,4,power_law_1.2,12.16803207397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,4,power_law_1.2,0.3816512107849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,balanced,0.48068265120188397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,balanced,0.5006186564763387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.2,0.4292543888092041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.2,0.5388991832733154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,balanced,0.5393759806950887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.2,0.7114111900329589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,balanced,0.5725333293279012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.2,0.9670528411865235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,balanced,0.6155840158462524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.2,1.3507840156555175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,balanced,0.7145866552988688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.2,1.6711296081542968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.2,2.2518335342407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,balanced,0.7993706862131754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.2,3.2587966918945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,balanced,0.038405333956082664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.2,4.8559425354003904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,balanced,0.05609600245952606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,balanced,1.073514699935913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,4,power_law_1.2,6.566400146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,balanced,0.0809386670589447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,balanced,0.13523733615875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,balanced,0.23808000485102335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,4,power_law_1.2,8.658975982666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,balanced,0.24150933821996054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,balanced,0.2421600023905436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,balanced,1.3822293281555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,balanced,0.244053324063619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,balanced,0.2465546727180481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,4,power_law_1.2,18.729913330078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,balanced,0.24914133548736572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.01,0.07759360074996949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.01,0.055257600545883176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,balanced,0.2501866618792216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.01,0.07415680289268493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.01,0.05692800283432007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,balanced,0.25390400489171344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.01,0.09751039743423462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,balanced,2.017434597015381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.01,0.06815999746322632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.01,0.15930880308151246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,balanced,0.2558293342590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.01,0.10430079698562622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.01,0.22070400714874266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,balanced,0.26125866174697876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.01,0.3575808048248291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.01,0.13569920063018798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.01,0.3760767936706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,balanced,0.2704906662305196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.01,0.19998079538345337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.01,0.3830080032348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,balanced,0.04901866614818573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.01,0.3889983892440796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,balanced,0.275818665822347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.01,0.20635519027709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.01,0.40254721641540525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,balanced,0.05910933514436086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,balanced,0.29049599170684814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.01,0.4043712139129639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.01,0.22106239795684815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,balanced,0.08218133449554443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.01,0.40369281768798826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,balanced,2.499546686808268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.01,0.22593278884887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,balanced,0.1356000006198883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.01,0.43540477752685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,balanced,0.31353600819905597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,balanced,0.23058666785558066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.01,0.4550464153289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.01,0.2253119945526123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,balanced,0.23553067445755005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.01,0.4800704002380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,balanced,0.3365066846211751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.01,0.2360703945159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,balanced,0.24014399449030557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.01,0.4718592166900635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.01,0.49646720886230467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,balanced,0.24088533719380698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.01,0.24583680629730226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,balanced,0.37909865379333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.01,0.5456768035888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,balanced,0.24450665712356567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.01,0.24801280498504638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.01,0.5558976173400879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,balanced,0.24856533606847128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,balanced,0.4230560064315796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.01,0.25870718955993655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.01,0.6105088233947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,balanced,0.25331199169158936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.01,0.683846378326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.01,0.26689920425415037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,balanced,0.2597653269767761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.01,0.8236607551574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.01,0.27533440589904784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,balanced,0.5335679848988851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.01,1.0054783821105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,balanced,0.26580800612767536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,balanced,3.0814294815063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.01,0.28696959018707274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.01,1.367155170440674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,balanced,0.2746613423029582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.01,0.3261375904083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.01,1.6807104110717774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,balanced,0.6261653502782186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.01,0.3554752111434937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.01,2.3771968841552735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.01,0.4018432140350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.01,3.1335487365722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.01,0.4592832088470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.01,3.6136638641357424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,balanced,0.2905760010083516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,balanced,0.8521813551584879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.01,0.5731008052825928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,balanced,0.2975359956423442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.01,6.044371032714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.01,0.6865471839904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.01,12.874298095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.01,0.9576831817626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,balanced,1.0970880190531414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.01,1.3066240310668946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.01,1.7345727920532226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.01,2.3209983825683596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,balanced,0.3220319946606954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,power_law_1.01,0.06455039978027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,balanced,5.1336320241292315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.01,2.901363182067871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,balanced,0.3747200171152751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,power_law_1.01,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,power_law_1.01,0.07329919934272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.01,4.692192077636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,balanced,0.4203039805094401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,balanced,1.5908907254536946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,power_law_1.01,0.10249600410461426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,balanced,0.527184009552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,power_law_1.01,0.14132479429244996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.01,9.9391357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,power_law_1.01,0.21006081104278565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,balanced,0.609226663907369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,power_law_1.01,0.2171583890914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,power_law_1.01,0.22597119808197022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,balanced,0.9155893325805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,power_law_1.01,0.2432255983352661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,power_law_1.01,0.23914880752563478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,power_law_1.01,0.2545088052749634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,balanced,2.1717440287272134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,power_law_1.01,0.26467840671539306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,balanced,1.096549352010091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,power_law_1.01,0.2792896032333374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,power_law_1.01,0.3015360116958618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,power_law_1.01,0.30820479393005373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,balanced,1.5940106709798176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,power_law_1.01,0.32476799488067626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,power_law_1.01,0.3413503885269165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,balanced,2.6715466181437173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,balanced,2.0974666277567544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,power_law_1.01,0.4161664009094238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,power_law_1.01,0.5034560203552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,power_law_1.01,0.6022079944610595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,power_law_1.01,0.7609792232513428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,power_law_1.01,1.030617618560791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,power_law_1.01,1.3513471603393554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,balanced,3.1301492055257163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,power_law_1.01,1.9281919479370118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,balanced,10.291925430297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,power_law_1.01,2.418400001525879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,2,power_law_1.2,0.07676799893379212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,power_law_1.01,3.4372222900390623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,2,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,power_law_1.01,4.726073455810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,2,power_law_1.2,0.10153599977493286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,2,power_law_1.2,0.1394495964050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,power_law_1.01,5.920185470581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,2,power_law_1.2,0.20689918994903564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,balanced,4.096768061319987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,2,power_law_1.2,0.35062398910522463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,power_law_1.01,9.134432220458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,balanced,4.127744038899739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,2,power_law_1.2,0.38592000007629396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,2,power_law_1.2,0.3977152109146118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,power_law_1.01,17.887936401367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,2,power_law_1.2,0.40900478363037107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,2,power_law_1.2,0.40276479721069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,2,power_law_1.2,0.4220479965209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,2,power_law_1.2,0.42420477867126466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,2,power_law_1.2,0.45255041122436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,2,power_law_1.2,0.4618048191070557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,2,power_law_1.2,0.05370879769325256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,2,power_law_1.2,0.48076162338256834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,balanced,5.139247894287109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,2,power_law_1.2,0.050835198163986205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,2,power_law_1.2,0.4856128215789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,2,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,2,power_law_1.2,0.5140416145324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,2,power_law_1.2,0.09203839898109437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,2,power_law_1.2,0.5661952018737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,2,power_law_1.2,0.11505919694900513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,2,power_law_1.2,0.5769599914550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,2,power_law_1.2,0.20135679244995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,2,power_law_1.2,0.6235072135925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,2,power_law_1.2,0.2164992094039917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,2,power_law_1.2,0.7186048030853271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,2,power_law_1.2,0.230515193939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,2,power_law_1.2,0.8945535659790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,2,power_law_1.2,0.22795519828796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,2,power_law_1.2,1.1193856239318847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,2,power_law_1.2,0.22797439098358155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,2,power_law_1.2,1.4563072204589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,2,power_law_1.2,0.23619840145111085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,2,power_law_1.2,1.8249919891357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,2,power_law_1.2,0.24927361011505128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,2,power_law_1.2,2.461311912536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,2,power_law_1.2,0.25420799255371096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,2,power_law_1.2,0.26041600704193113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,2,power_law_1.2,3.1544832229614257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,balanced,8.211141586303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,2,power_law_1.2,0.2700671911239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,2,power_law_1.2,0.28989439010620116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,2,power_law_1.2,4.0659137725830075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,2,power_law_1.2,0.29923200607299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,2,power_law_1.2,0.3303168058395386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,2,power_law_1.2,6.2337791442871096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,2,power_law_1.2,0.3631488084793091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,balanced,8.556053161621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,2,power_law_1.2,0.4140031814575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,2,power_law_1.2,13.626535034179687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,2,power_law_1.2,0.4790207862854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,2,power_law_1.2,0.6129087924957275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,2,power_law_1.2,0.7725696086883544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,2,power_law_1.2,0.9921855926513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,2,power_law_1.2,1.3346176147460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,2,power_law_1.2,1.8823104858398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,2,power_law_1.2,2.495859146118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,2,power_law_1.2,3.3678657531738283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,2,power_law_1.2,5.346790313720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,2,power_law_1.2,0.06417919993400574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,2,power_law_1.2,10.218515014648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,2,power_law_1.2,0.05400320291519165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,2,power_law_1.2,0.07315840125083924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,2,power_law_1.2,0.09339519739151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,balanced,0.0544106662273407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,2,power_law_1.2,0.11998720169067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,balanced,0.07544533411661784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,2,power_law_1.2,0.20245120525360108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,balanced,0.1264693339665731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,balanced,16.47115198771159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,balanced,0.22894400358200073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,2,power_law_1.2,0.22064640522003173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,balanced,0.4188266595204671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,balanced,0.4273333152135213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,2,power_law_1.2,0.2218048095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,balanced,0.4317226807276408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,2,power_law_1.2,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,balanced,0.43370668093363446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,2,power_law_1.2,0.25445759296417236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,balanced,0.4322773218154907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,2,power_law_1.2,0.268723201751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,balanced,0.43826134999593097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,balanced,0.43877331415812176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,2,power_law_1.2,0.26552319526672363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,balanced,0.44411734739939374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,2,power_law_1.2,0.2840384006500244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,balanced,0.44978133837382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,2,power_law_1.2,0.3121151924133301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,balanced,0.4572746753692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,balanced,0.4766346613566081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,balanced,0.48265600204467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,balanced,0.5090399980545044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,2,power_law_1.2,0.32181758880615235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,balanced,0.5516853332519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,2,power_law_1.2,0.33802878856658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,balanced,0.585973342259725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,balanced,0.6532800197601318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,2,power_law_1.2,0.3535680055618286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,balanced,0.7294399738311768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,balanced,0.04186133543650309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,2,power_law_1.2,0.42590718269348143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,balanced,0.9024213155110677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,2,power_law_1.2,0.5030399799346924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,balanced,0.0572213331858317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,balanced,0.08430400490760803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,2,power_law_1.2,0.6550655841827393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,balanced,0.13648533821105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,2,power_law_1.2,0.7507904052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,balanced,1.0773013432820637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,balanced,0.23600532611211142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,2,power_law_1.2,1.066592025756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,balanced,0.23760000864664713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,2,power_law_1.2,1.3914175987243653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,balanced,0.23995733261108398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,balanced,0.24266133705774942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,2,power_law_1.2,2.101171112060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,balanced,0.24563199281692505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,balanced,1.4480853080749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,2,power_law_1.2,2.6965951919555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,balanced,0.24768000841140747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,balanced,0.25196800629297894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,2,power_law_1.2,4.2674304962158205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,balanced,0.2567360003789266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,balanced,0.26521066824595135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,2,power_law_1.2,5.564134216308593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,balanced,0.27113600571950275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,balanced,1.8370879491170247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,balanced,0.28497066100438434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,2,power_law_1.2,6.040742492675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,balanced,0.29527999957402545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,balanced,0.3195040027300517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,2,power_law_1.2,11.176914978027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,balanced,0.3572746515274048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,balanced,0.07043200234572093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,balanced,0.38203199704488117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,balanced,0.07572266459465027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,balanced,0.44785598913828534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,balanced,2.6631360054016113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,2,power_law_1.2,20.7461181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,balanced,0.0990666647752126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,balanced,0.5170133511225382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,balanced,0.15160533785820007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,balanced,0.2550613284111023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,balanced,0.2614506681760152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,balanced,0.7222080230712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,balanced,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,balanced,0.270959993203481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,balanced,0.8981653054555258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,balanced,0.27585599819819134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,balanced,0.28146133820215863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,balanced,3.535578727722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,balanced,0.28993066151936847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,balanced,1.287061293919881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,balanced,0.3008799950281779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,balanced,0.31011199951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,balanced,0.32316799958546955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,balanced,1.6830827395121257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,balanced,0.34885334968566895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,balanced,4.373711903889974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,balanced,0.36815468470255536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,balanced,2.516421318054199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.052985602617263795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,balanced,0.4392373164494832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.01,0.03806720077991486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.0584384024143219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,balanced,0.5348266760508219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.01,0.0462336003780365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.09759359955787658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.01,0.07011839747428894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,balanced,3.312682787577311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,balanced,0.5941760142644247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.01,0.10033919811248779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.15777280330657958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.01,0.12868479490280152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,balanced,0.790986696879069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.01,0.20405120849609376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.21267199516296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.01,0.2186880111694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.3540096044540405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.01,0.22892160415649415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,balanced,0.9309333165486654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.3774399995803833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.01,0.2310528039932251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.3884608030319214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,balanced,6.695498784383138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.01,0.2535232067108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.3912960052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,balanced,1.4152320226033528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.01,0.26306560039520266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.40360321998596194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.01,0.2791680097579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.40358400344848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.01,0.2862335920333862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.42674560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,balanced,1.7506720225016277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,balanced,4.16590944925944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.01,0.2958847999572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.46512641906738283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.01,0.3117759943008423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.01,0.33207039833068847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.44475522041320803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.01,0.3839679956436157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.4852608203887939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.01,0.41048321723937986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,balanced,2.5798452695210776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.49747838973999026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.01,0.48572797775268556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.01,0.5707903861999511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.5267327785491943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.01,0.7394239902496338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.5931519985198974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,power_law_1.01,0.06259199976921082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.01,0.9009471893310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.6098944187164307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.01,1.2654848098754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.7019199848175048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,balanced,3.4125493367513022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,power_law_1.01,0.07251200079917908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.01,1.6598783493041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.7784319877624511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,power_law_1.01,0.08675839900970458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.01,2.4413120269775392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.9559935569763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.01,3.210406494140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.05268480181694031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,power_law_1.01,0.11863679885864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.01,3.9869823455810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.01,1.1111359596252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,power_law_1.01,0.14324480295181274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.0597055971622467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,power_law_1.01,0.21823999881744385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.01,1.5565055847167968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.09122560024261475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.01,6.513247680664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,power_law_1.01,0.23739519119262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.1369472026824951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,balanced,6.06710942586263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,balanced,5.04091739654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.9834239959716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,power_law_1.01,0.24705278873443604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.20016000270843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.01,13.304421997070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.01,2.8608448028564455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.3546816110610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,power_law_1.01,0.2640064001083374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,power_law_1.01,0.26467840671539306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.3817536115646362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.01,3.669625473022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,power_law_1.01,0.2864896059036255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.3942080020904541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.01,4.536435317993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.40913920402526854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,power_law_1.01,0.3050816059112549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.42206082344055174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,power_law_1.01,0.3234368085861206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.01,6.801241302490235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.43299198150634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,power_law_1.01,0.3460223913192749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,balanced,6.657898585001628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.4429632186889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.4677055835723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.01,14.594674682617187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.4635903835296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,power_law_1.01,0.3681600093841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,balanced,13.264592488606771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.487059211730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,power_law_1.01,0.39594879150390627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.5008063793182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.5245888233184814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,power_law_1.01,0.4407936096191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.5883520126342774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,1,power_law_1.2,0.6156352043151856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,power_law_1.01,0.5553215980529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.7080575942993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.01,0.6492288112640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,balanced,8.425717035929361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.7886591911315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.01,0.8295552253723144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.9859264373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.01,1.018560028076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,1,power_law_1.2,1.1569727897644042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.01,1.428377628326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,1,power_law_1.2,1.5932607650756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.01,1.8353343963623048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,1,power_law_1.2,2.0114879608154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.01,2.6456319808959963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,1,power_law_1.2,2.907302474975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.01,3.457004928588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,1,power_law_1.2,3.7417152404785154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.01,5.071295928955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,balanced,12.520362854003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,1,power_law_1.2,4.52606086730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.01,6.683929443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.041126400232315063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,1,power_law_1.2,6.779679870605468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.01,8.305107116699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.04886400103569031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,1,power_law_1.2,14.558387756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,power_law_1.01,13.127743530273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,balanced,13.28374989827474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.1161344051361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,power_law_1.01,26.095852661132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.20444800853729247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.2232640027999878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.23050880432128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.23508479595184326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.24280319213867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.25419518947601316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.2663232088088989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.2718400001525879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.2819135904312134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.2996223926544189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,1,power_law_1.2,0.31258881092071533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,1,power_law_1.2,0.3330687999725342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,1,power_law_1.2,0.3793728113174438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,0.41011838912963866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,0.49134078025817873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,0.5756927967071533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,0.7335296154022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,0.9066495895385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,1.2777024269104005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,balanced,26.49194081624349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,1.664076805114746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,2.429318428039551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,3.1761856079101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,1,power_law_1.2,3.9310462951660154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,1,power_law_1.2,6.516659545898437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,1,power_law_1.2,12.946150207519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,1,power_law_1.2,0.06282879710197449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,1,power_law_1.2,0.07152000069618225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,1,power_law_1.2,0.08444160223007202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,1,power_law_1.2,0.11193599700927734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,1,power_law_1.2,0.13114880323410033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,balanced,0.1197813351949056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,1,power_law_1.2,0.22846720218658448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,1,power_law_1.2,0.23916800022125245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,balanced,0.15934933225313822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,balanced,0.0775786687930425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,1,power_law_1.2,0.25474560260772705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,balanced,0.2859039902687073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,balanced,0.5304640134175619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,1,power_law_1.2,0.2712831974029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,balanced,1.0138346354166667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,balanced,0.10547199845314026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,1,power_law_1.2,0.2782912015914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,balanced,1.2693440119425456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,1,power_law_1.2,0.28947839736938474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,balanced,0.1663146714369456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,1,power_law_1.2,0.3141824007034302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,balanced,1.2731413046518962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,balanced,0.28988800446192425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,1,power_law_1.2,0.3239295959472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,balanced,1.2721013228098552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,balanced,0.534447987874349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,1,power_law_1.2,0.3540544033050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,balanced,1.275546630223592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,balanced,0.6579999923706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,balanced,1.2805333137512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,balanced,0.6617546478907267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,balanced,0.6620266834894816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,1,power_law_1.2,0.3749887943267822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,balanced,1.2860693136850994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,balanced,0.666645328203837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,1,power_law_1.2,0.4104896068572998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,balanced,0.6687093575795492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,balanced,1.2889973322550456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,balanced,0.6753919919331869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,balanced,1.2961013317108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,balanced,0.6780959765116373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,1,power_law_1.2,0.45016961097717284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,balanced,1.314143975575765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,balanced,0.6827253500620524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,1,power_law_1.2,0.5582911968231201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,balanced,1.3210293451944988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,balanced,0.6915679772694906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.2,0.6593023777008057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,balanced,1.3276159763336182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,balanced,0.707157293955485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.2,0.8400575637817382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,balanced,0.7089227040608724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,balanced,1.3429226875305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.2,1.040435218811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,balanced,0.7246987024943033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.2,1.4517824172973632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,balanced,1.3787360191345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.2,1.854924774169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,balanced,0.7529813448588053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,balanced,1.4087413152058919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.2,2.671980857849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,balanced,0.7763413588205973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.2,3.488140869140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,balanced,1.4983146985371907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,balanced,0.8993226687113444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.2,5.130188751220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.01,0.2871488094329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,balanced,1.5290932655334473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.2,6.739116668701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,balanced,0.07489066819349925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.16462719440460205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.01,0.412230396270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,balanced,0.8712426821390787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.2,8.375660705566407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,balanced,0.10618133346239726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.01,0.27714560031890867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,balanced,2.4652746518452964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.25315840244293214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,balanced,0.18668266137441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.01,0.4305408000946045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,balanced,1.3142720063527424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.01,0.1418176054954529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,1,power_law_1.2,13.274566650390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,balanced,0.2876266638437907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.01,0.6532351970672607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.01,0.22576639652252198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,balanced,0.5243306557337443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,balanced,1.7818773587544758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.01,0.9752063751220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,balanced,1.1259733041127522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,balanced,0.6510026852289835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.01,0.3379199981689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,1,power_law_1.2,26.295059204101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.01,1.0272128105163574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,balanced,0.6557439963022867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.01,0.5197567939758301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.01,1.094816017150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,balanced,0.658186674118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,balanced,2.8978614807128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.01,0.5487040042877197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,balanced,0.6631253163019816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.01,1.042080020904541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,balanced,1.7995786666870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,balanced,0.6658186515172323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.01,1.138809585571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.01,0.583673620223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,balanced,0.6731359958648682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.01,1.1428352355957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,balanced,0.6797280311584473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.01,0.5839168071746826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,balanced,3.0345331827799478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.01,1.2375935554504394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,balanced,0.6857706705729166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.01,0.5993279933929443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,balanced,2.167520046234131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,balanced,0.6980960369110107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.01,1.2811391830444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.01,0.6217023849487304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,balanced,0.7149120171864828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.01,1.2332223892211913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.01,0.6410687923431396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.01,1.335756778717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.01,0.6987199783325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.01,1.3865983963012696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,balanced,3.7753067016601562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.01,1.4665727615356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.01,0.6833343982696534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,balanced,2.598896026611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,balanced,0.7264426549275717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.01,1.6793407440185546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.01,0.7070464134216309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.01,1.6885631561279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.01,1.96441593170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.01,0.7316544055938721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.01,2.1877952575683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.01,0.733081579208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.01,2.5540416717529295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,balanced,0.7497813701629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,power_law_1.01,0.1729599952697754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.01,0.781612777709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,balanced,5.385199864705403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.01,2.559519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,power_law_1.01,0.24698240756988527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,balanced,3.5708745320638022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,0.8576191902160645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.01,3.3131519317626954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,power_law_1.01,0.14737279415130616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.01,4.294099044799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,power_law_1.01,0.2492608070373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,1.0402751922607423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,power_law_1.01,0.3119359970092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.01,6.026950454711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,1.1271295547485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,power_law_1.01,0.5231359958648681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,power_law_1.01,0.572486400604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,1.487660789489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.01,7.362662506103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,power_law_1.01,0.5668416023254395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,balanced,0.8004159927368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,1.6062463760375976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,power_law_1.01,0.602016019821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.01,9.506604766845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,1.9903999328613282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,balanced,0.8531520366668701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,power_law_1.01,0.6184000015258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,balanced,5.756079991658528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,power_law_1.01,0.6587776184082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,balanced,0.9548693497975668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,2.737779235839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.01,13.319705200195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,power_law_1.01,0.6767295837402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,balanced,3.9045492808024087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,4,power_law_1.2,0.286297607421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,power_law_1.01,0.7403264045715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,3.5249088287353514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,balanced,1.0528266429901123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,4,power_law_1.2,0.172435200214386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,power_law_1.01,0.8177472114562988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,power_law_1.01,0.8689663887023926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,4,power_law_1.2,0.23255040645599365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,4.464019012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.01,29.68187561035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,balanced,1.4751572608947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,4,power_law_1.2,0.40464000701904296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.01,4.720281600952148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,4,power_law_1.2,0.5311615943908692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,power_law_1.01,0.806163215637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,4,power_law_1.2,0.9144191741943359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,balanced,1.6625866889953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.01,8.97228775024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,4,power_law_1.2,1.065567970275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,power_law_1.01,0.8909952163696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,4,power_law_1.2,1.1660223960876466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.01,19.82532501220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,4,power_law_1.2,1.2001024246215821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,balanced,2.4453813234965005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,power_law_1.01,0.8937088012695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,4,power_law_1.2,1.2128576278686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,balanced,9.710469563802084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.01,1.0600064277648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,4,power_law_1.2,1.2166015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.01,1.1209792137145995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,balanced,6.729951858520508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.01,1.3079680442810058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,4,power_law_1.2,1.344166374206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,balanced,3.254021326700846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.01,1.8297216415405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,4,power_law_1.2,1.409209632873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.01,2.142739105224609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,4,power_law_1.2,1.2777024269104005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.01,3.2973953247070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,4,power_law_1.2,1.4197440147399902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.01,4.076319885253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,4,power_law_1.2,1.399129581451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.01,6.3434497833251955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,balanced,4.498192151387532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,4,power_law_1.2,1.5147839546203614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.01,7.533734130859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,4,power_law_1.2,1.7568319320678711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,power_law_1.01,10.127865600585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,4,power_law_1.2,1.705036735534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,4,power_law_1.2,2.2392192840576173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,power_law_1.01,16.1210693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,4,power_law_1.2,2.2132863998413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,4,power_law_1.2,2.813395118713379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,4,power_law_1.2,2.7930559158325194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,power_law_1.01,36.23672180175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,4,power_law_1.2,3.4178302764892576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,balanced,6.181925455729167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,4,power_law_1.2,4.832134246826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,4,power_law_1.2,7.917420959472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,4,power_law_1.2,8.854239654541015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,4,power_law_1.2,11.261612701416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,4,power_law_1.2,14.473356628417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,balanced,7.536474863688151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,balanced,26.194747924804688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,balanced,15.427108764648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,4,power_law_1.2,35.711019897460936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,4,power_law_1.2,0.17664639949798583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,4,power_law_1.2,0.12446080446243286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,4,power_law_1.2,0.16317440271377565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,4,power_law_1.2,0.22527360916137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,4,power_law_1.2,0.31269121170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,4,power_law_1.2,0.5267072200775147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,4,power_law_1.2,0.5657216072082519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,4,power_law_1.2,0.592409610748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,4,power_law_1.2,0.6147520065307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,balanced,12.418261210123697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,4,power_law_1.2,0.6299392223358155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,4,power_law_1.2,0.6858176231384278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,4,power_law_1.2,0.7025407791137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,4,power_law_1.2,0.7930816173553467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,4,power_law_1.2,0.7542463779449463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,4,power_law_1.2,0.7506944179534912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,4,power_law_1.2,0.819603157043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,4,power_law_1.2,0.8001152038574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,4,power_law_1.2,0.906879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,4,power_law_1.2,0.991756820678711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,4,power_law_1.2,1.140345573425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,4,power_law_1.2,1.2544575691223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,4,power_law_1.2,1.4941887855529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,4,power_law_1.2,1.7132095336914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,4,power_law_1.2,2.311635208129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,4,power_law_1.2,2.950675201416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,4,power_law_1.2,4.38856315612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,4,power_law_1.2,4.881324768066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,4,power_law_1.2,6.3421886444091795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,4,power_law_1.2,9.77533416748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,4,power_law_1.2,25.573811340332032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,balanced,26.68647003173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,4,power_law_1.2,0.17281919717788696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,4,power_law_1.2,0.11383680105209351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,4,power_law_1.2,0.15753599405288696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,balanced,0.11316266655921936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,4,power_law_1.2,0.22188799381256102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,balanced,0.15808000167210898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,4,power_law_1.2,0.29697279930114745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,balanced,0.2851840058962504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,4,power_law_1.2,0.5098688125610351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,balanced,0.5317386786142985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,balanced,1.0193013350168865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,4,power_law_1.2,0.5518911838531494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,balanced,1.2754826545715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,4,power_law_1.2,0.5849728107452392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,balanced,1.276959975560506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,4,power_law_1.2,0.6305344104766846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,balanced,1.2842293580373128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,4,power_law_1.2,0.6339839935302735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,balanced,1.2860106627146404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,4,power_law_1.2,0.6785280227661132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,balanced,1.2918506463368733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,balanced,1.295349359512329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,4,power_law_1.2,0.7078271865844726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,balanced,1.3116319974263508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,4,power_law_1.2,0.7472383975982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,balanced,1.3175360361735027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,4,power_law_1.2,0.8001791954040527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,balanced,0.07887466748555501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,balanced,1.3273653189341228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,4,power_law_1.2,0.8996607780456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,balanced,0.10599467158317566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,balanced,1.3451306025187175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,balanced,0.1646453340848287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,balanced,1.356895923614502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,balanced,0.2924746672312419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,4,power_law_1.2,0.8427647590637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,balanced,1.3847146034240723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,balanced,0.535536011060079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,balanced,1.4139679272969563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,balanced,0.6612480084101359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,4,power_law_1.2,0.8756287574768067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,balanced,0.6649226744969686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,balanced,1.447114626566569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,balanced,0.6746346950531006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,balanced,0.6811040242513021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,balanced,1.8030026753743489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,balanced,0.6857653458913168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,4,power_law_1.2,0.9407360076904296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,balanced,0.6853973070780436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.2,1.1246656417846679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,balanced,1.6149120330810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,balanced,0.6910239855448405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.2,1.2579903602600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,balanced,0.6978560288747152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,balanced,0.7084000110626221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.2,1.4673151969909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,balanced,2.635983943939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,balanced,0.7221333185831705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.2,2.012985610961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,balanced,0.7299839655558268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.01,0.1809216022491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,balanced,0.08796266714731853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.2,2.4602176666259767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,balanced,1.9676319758097331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,balanced,0.7491146723429362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.01,0.24218881130218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,balanced,0.11284266908963521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.2,3.556844711303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.01,0.11599359512329102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.01,0.22881920337677003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,balanced,0.8394933541615804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,balanced,0.1938613255818685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.01,0.40695037841796877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.2,4.303827285766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.01,0.14311039447784424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,balanced,0.2954240043958028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,balanced,0.8194719950358073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.01,0.5802688121795654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,balanced,3.1033493677775064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,balanced,0.5356800158818563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.01,0.9345664024353028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.01,0.14519040584564208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.2,6.624729919433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,balanced,1.1326026916503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,balanced,0.6635146538416544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.01,1.0330752372741698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.01,0.2355583906173706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.01,1.0682432174682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,balanced,0.669322649637858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.2,9.66333465576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.01,0.3118016004562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,balanced,0.9657546679178873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.01,1.1292223930358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,balanced,0.6757813294728597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.01,1.135807991027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.01,0.503276777267456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,balanced,0.6797813574473063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,balanced,3.283034642537435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,4,power_law_1.2,10.77391357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.01,1.1709183692932128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,balanced,1.3291467030843098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.01,0.5344064235687256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,balanced,0.6871039867401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.01,1.2722368240356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,balanced,0.6963520050048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.01,1.304966354370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.01,0.5795199871063232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,4,power_law_1.2,20.620831298828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.01,1.2654720306396485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,balanced,0.7080533504486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.01,0.6200128078460694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,balanced,1.2875466346740723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.01,1.353593635559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,balanced,0.7168479760487875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.01,0.6113024234771729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.01,1.3950783729553222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,balanced,0.7310720284779867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.01,0.6059008121490479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.01,1.406272029876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,balanced,4.791141192118327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,balanced,0.7518560091654459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.01,0.6577407836914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.01,1.5824000358581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,balanced,1.975162665049235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.01,0.686188793182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.01,1.7304576873779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,4,power_law_1.2,51.815887451171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.01,0.6853184223175048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.01,2.11596794128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.01,2.125555229187012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.01,0.7380735874176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,balanced,0.7691840330759684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.01,2.598361587524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.01,0.7663360118865967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,balanced,2.2522560755411782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.01,2.4618879318237306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.01,0.7273471832275391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.01,3.2625728607177735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.01,0.8193280220031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,balanced,6.5034027099609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.01,3.8936321258544924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.01,0.8938048362731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.01,5.244128036499023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,balanced,0.8093600273132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.01,1.0774847984313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.01,7.057369232177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,balanced,3.1346187591552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.01,1.1177920341491698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.01,8.671289825439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.01,1.3728256225585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.01,1.6174144744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.01,12.288480377197265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.01,2.0750783920288085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.01,2.5454912185668945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.01,22.53004150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,balanced,7.285845438639323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.01,3.5086719512939455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,balanced,0.9040799935658773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,balanced,4.431285222371419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.01,4.985523223876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,balanced,0.9696319897969564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,power_law_1.01,0.12373759746551513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.01,5.543302536010742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,power_law_1.01,0.1544000029563904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,balanced,1.1210880279541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,power_law_1.01,0.13647359609603882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,balanced,1.2756160100301106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.01,9.104377746582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,power_law_1.01,0.24101760387420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,power_law_1.01,0.3208832025527954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,balanced,1.82149871190389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,2,power_law_1.2,0.18277759552001954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,power_law_1.01,0.5088448047637939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.01,15.46411590576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,2,power_law_1.2,0.14057600498199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,power_law_1.01,0.5623551845550537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,2,power_law_1.2,0.1896064043045044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,power_law_1.01,0.6038335800170899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,balanced,2.1123147010803223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,balanced,5.0231679280598955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,power_law_1.01,0.6063424110412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,2,power_law_1.2,0.35481600761413573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,power_law_1.01,0.6495423793792725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,2,power_law_1.2,0.4690688133239746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,power_law_1.01,0.684223985671997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,power_law_1.01,0.6998015880584717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,balanced,3.1367839177449546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,2,power_law_1.2,0.9349696159362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,balanced,11.246528625488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,power_law_1.01,0.7526976108551026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,2,power_law_1.2,1.0375743865966798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,power_law_1.01,0.8033344268798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,power_law_1.01,0.8645503997802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,2,power_law_1.2,1.0619263648986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,2,power_law_1.2,1.1300992012023925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,balanced,4.16758918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,2,power_law_1.2,1.148908805847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,power_law_1.01,0.828217601776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,2,power_law_1.2,1.2145600318908691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,2,power_law_1.2,1.2928895950317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,power_law_1.01,0.8986623764038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,2,power_law_1.2,1.3571904182434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,2,power_law_1.2,1.3493375778198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,2,power_law_1.2,1.3485312461853027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,power_law_1.01,0.9878463745117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,balanced,5.903893152872722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,balanced,8.004213333129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,2,power_law_1.2,1.4129728317260741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,power_law_1.01,1.126425552368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,power_law_1.01,1.261580753326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,2,power_law_1.2,1.4997183799743652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,power_law_1.01,1.4949695587158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,2,power_law_1.2,1.6747520446777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,power_law_1.01,1.9565824508666991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,2,power_law_1.2,1.8555519104003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,power_law_1.01,2.5444095611572264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,2,power_law_1.2,2.233932876586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,power_law_1.01,3.5860031127929686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,2,power_law_1.2,2.183340835571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,power_law_1.01,4.55164794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,2,power_law_1.2,2.6964288711547852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,balanced,8.257845560709635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,power_law_1.01,6.95098876953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,2,power_law_1.2,2.627142333984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,2,power_law_1.2,3.435251235961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,power_law_1.01,8.738905334472657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,2,power_law_1.2,4.183039855957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,power_law_1.01,10.956224060058593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,2,power_law_1.2,5.240217590332032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,power_law_1.01,17.147039794921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,2,power_law_1.2,7.737273406982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,2,power_law_1.2,9.372710418701171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,balanced,20.52127965291341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,balanced,9.822175979614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,power_law_1.01,33.51969909667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,2,power_law_1.2,13.064895629882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,2,power_law_1.2,24.690386962890624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,balanced,15.952805836995443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,balanced,16.64421844482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,2,power_law_1.2,0.11516799926757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,2,power_law_1.2,0.08723199963569642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,2,power_law_1.2,0.1335935950279236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,2,power_law_1.2,0.201964807510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,2,power_law_1.2,0.26855039596557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,2,power_law_1.2,0.5142015933990478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,2,power_law_1.2,0.5357503890991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,2,power_law_1.2,0.5885183811187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,2,power_law_1.2,0.5929728031158448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,2,power_law_1.2,0.6137728214263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,2,power_law_1.2,0.6592959880828857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,2,power_law_1.2,0.6644927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,2,power_law_1.2,0.6976064205169678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,2,power_law_1.2,0.7044864177703858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,2,power_law_1.2,0.7284992218017579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,2,power_law_1.2,0.7771776199340821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,2,power_law_1.2,0.764185619354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,2,power_law_1.2,0.12581119537353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,2,power_law_1.2,0.8592703819274903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,2,power_law_1.2,0.09125120043754578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,2,power_law_1.2,0.9140031814575196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,balanced,33.55316925048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,2,power_law_1.2,0.1523327946662903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,balanced,0.11504532893498738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,2,power_law_1.2,1.0892864227294923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,2,power_law_1.2,0.20770559310913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,2,power_law_1.2,1.1891839981079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,balanced,0.15896532932917276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,2,power_law_1.2,0.31227519512176516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,2,power_law_1.2,0.5216447830200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,2,power_law_1.2,1.409984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,balanced,0.2877226670583089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,2,power_law_1.2,0.5590208053588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,2,power_law_1.2,1.6509376525878907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,balanced,0.5372533400853475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,2,power_law_1.2,0.592851209640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,2,power_law_1.2,2.151251220703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,balanced,1.0313546657562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,2,power_law_1.2,0.6072832107543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,2,power_law_1.2,2.502348709106445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,balanced,1.287343978881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,2,power_law_1.2,0.6321407794952393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,balanced,1.2903839747111003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,2,power_law_1.2,0.7057216167449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,2,power_law_1.2,3.6841983795166016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,balanced,1.2956586678822835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,2,power_law_1.2,0.7125760078430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,2,power_law_1.2,5.326835250854492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,balanced,1.3043893178304036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,2,power_law_1.2,0.7388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,2,power_law_1.2,0.8201855659484864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,2,power_law_1.2,6.373267364501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,balanced,1.3107733726501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,2,power_law_1.2,0.8525055885314942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,balanced,1.3166986306508381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,2,power_law_1.2,8.603916931152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,balanced,1.332682689030965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,2,power_law_1.2,0.8605888366699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,balanced,1.3487146695454915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,2,power_law_1.2,16.846354675292968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,balanced,1.3585440317789714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,balanced,1.381648063659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,2,power_law_1.2,0.9292799949645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,balanced,1.3970880508422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,balanced,1.4338453610738118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,2,power_law_1.2,1.0382656097412108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,balanced,1.7329707145690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,2,power_law_1.2,1.1778240203857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,2,power_law_1.2,1.3118016242980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,balanced,1.552768071492513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,2,power_law_1.2,1.5896703720092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,balanced,1.6648747126261394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,2,power_law_1.2,2.096339225769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,balanced,1.7955999374389648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,2,power_law_1.2,2.659686470031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,2,power_law_1.2,3.7257728576660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,balanced,2.4534719785054526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,2,power_law_1.2,4.725286483764648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,2,power_law_1.2,6.549715423583985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,balanced,2.3247040112813315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,balanced,0.08065066734949748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,2,power_law_1.2,9.216524505615235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,balanced,0.10660266876220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,balanced,0.1689280072848002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,balanced,0.29949865738550824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,balanced,4.190634727478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,2,power_law_1.2,10.979910278320313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,balanced,0.5594079891840616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,balanced,0.698362668355306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.11415679454803467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,balanced,0.706613302230835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,balanced,0.7101866404215494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,2,power_law_1.2,18.591845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.14304640293121337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,balanced,0.7118826707204183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,balanced,0.7139893372853597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.22211201190948487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,balanced,3.977936108907064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.01,0.07343999743461609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,balanced,0.7207626501719157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.38264319896697996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,balanced,0.7286400000254313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,2,power_law_1.2,36.92911376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.5590400218963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.01,0.09575679898262024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,balanced,0.7430666287740072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,balanced,0.10338133573532104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.01,0.12455040216445923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.9317952156066894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,balanced,0.7514826456705729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.01,0.22199039459228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,balanced,0.12777066230773926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.01,1.0115008354187012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,balanced,0.7648320198059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.01,0.30738561153411864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,balanced,0.18549867471059164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,balanced,0.772810697555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.01,1.0556351661682128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.01,0.514796781539917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,balanced,0.3089173237482707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,balanced,5.280645370483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,balanced,0.7985386848449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,balanced,0.5551573435465494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.01,0.5459328174591065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.01,1.116767978668213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,balanced,0.6851680278778076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,balanced,0.9452106952667236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.01,0.5791679859161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.01,1.1321727752685546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,balanced,0.6943093140920004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.01,0.5956543922424317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,balanced,0.91866668065389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.01,1.1917951583862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,balanced,0.7042346795399984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.01,0.6000383853912353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.01,0.6720704078674317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.01,1.2261631965637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,balanced,0.7130719820658366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,balanced,1.1296053727467854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.01,0.6726975917816163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,balanced,0.7210453351338705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.01,1.2562496185302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.01,0.7240896224975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,balanced,1.1599520047505696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,balanced,0.7328426837921143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.01,1.278003215789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.01,0.686624002456665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,balanced,0.7492799758911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,balanced,7.136266708374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.01,0.7174272060394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.01,1.339686393737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,balanced,1.5890560150146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,balanced,0.7630399862925211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.01,0.7535744190216065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.01,1.4017151832580566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,balanced,0.7929653326670328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.01,0.8026047706604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.01,1.4160703659057616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.01,0.908563232421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,balanced,0.836138645807902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,balanced,1.6616106033325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.01,1.5690367698669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.01,0.967033576965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.01,1.7713151931762696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.01,1.1156800270080567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.01,2.0842815399169923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.01,1.1965120315551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,balanced,2.543253262837728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.01,1.5134976387023926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.01,2.188275146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,balanced,0.8734880288441976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.01,1.85665283203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.01,2.750912094116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.01,2.4393152236938476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.01,3.1668224334716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,balanced,8.584325154622396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.01,2.9451135635375976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.01,4.39733772277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,balanced,2.943450609842936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,balanced,0.9406720002492269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.01,4.228672027587891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.01,4.3367870330810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.01,5.643603134155273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.01,6.210265731811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.01,7.0969085693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.01,8.176383972167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,balanced,4.184261322021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.01,10.796678161621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.01,10.214169311523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,balanced,1.1016053358713787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,power_law_1.01,0.1092352032661438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.01,21.26240692138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.01,15.961849975585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,balanced,1.2265493075052898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,power_law_1.01,0.13084800243377687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,power_law_1.01,0.15411200523376464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,balanced,1.506992022196452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,power_law_1.01,0.22878720760345458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.01,24.972799682617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,power_law_1.01,0.32084479331970217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,balanced,5.460224151611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,balanced,1.7845120429992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,balanced,13.941605885823568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,power_law_1.01,0.5390655994415283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,power_law_1.01,0.5613376140594483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,balanced,2.676234563191732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,power_law_1.01,0.6010176181793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,power_law_1.01,0.6218111991882325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,power_law_1.01,0.6390016078948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,balanced,3.276240030924479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,power_law_1.01,0.6882175922393798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,power_law_1.01,0.7362559795379638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,balanced,6.404314676920573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,power_law_1.01,0.7565120220184326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,balanced,4.798266728719075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,power_law_1.01,0.833625602722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,power_law_1.01,0.9421504020690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,balanced,6.37220827738444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,power_law_1.01,0.9316672325134278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.11425280570983887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,power_law_1.01,1.0196543693542481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.11877119541168213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.1938367962837219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.34729599952697754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.4719552040100098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,balanced,9.015600204467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,power_law_1.01,1.1478976249694823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.9729408264160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.01,1.326591968536377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,1,power_law_1.2,1.0003071784973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,balanced,10.7272580464681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,1,power_law_1.2,1.0669695854187011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.01,1.57838716506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,1,power_law_1.2,1.132844829559326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.01,1.914975929260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,1,power_law_1.2,1.1650752067565917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.01,2.564876747131348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,1,power_law_1.2,1.222099208831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.01,3.265760040283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,1,power_law_1.2,1.220684814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,1,power_law_1.2,1.2677824020385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,balanced,26.87535349527995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,balanced,12.108821868896484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.01,4.615827178955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,1,power_law_1.2,1.3465727806091308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,1,power_law_1.2,1.3707839965820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.01,5.936102294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,1,power_law_1.2,1.4142720222473144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,1,power_law_1.2,1.4579327583312989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.01,8.74417953491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,1,power_law_1.2,1.629849624633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,1,power_law_1.2,1.8071296691894532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,1,power_law_1.2,2.114246368408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.01,11.429459381103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,1,power_law_1.2,2.2910783767700194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,1,power_law_1.2,2.8520576477050783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.01,14.355378723144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,1,power_law_1.2,3.3950336456298826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,balanced,14.642047882080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.07845119833946228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,1,power_law_1.2,4.458284759521485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,power_law_1.01,22.755007934570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,1,power_law_1.2,4.559731292724609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.08277119994163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.12476160526275634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,1,power_law_1.2,6.30975341796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.19514240026474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,1,power_law_1.2,8.380825805664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,1,power_law_1.2,0.2663935899734497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,1,power_law_1.2,0.5032063961029053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,1,power_law_1.2,10.227999877929687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,power_law_1.01,46.67544860839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,1,power_law_1.2,0.5410367965698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,1,power_law_1.2,0.5831232070922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,1,power_law_1.2,15.837158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,1,power_law_1.2,0.6143360137939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,1,power_law_1.2,0.6436607837677002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,balanced,20.953637440999348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,1,power_law_1.2,24.94047393798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,1,power_law_1.2,0.672979211807251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,1,power_law_1.2,0.7083136081695557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,1,power_law_1.2,0.740889596939087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,1,power_law_1.2,0.7081727981567383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,balanced,24.70855458577474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,1,power_law_1.2,0.7482111930847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,1,power_law_1.2,0.7723711967468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,1,power_law_1.2,0.8164544105529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,1,power_law_1.2,0.9049216270446777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,0.9607168197631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,1.1107711791992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,1.2237119674682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,1.5418047904968262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,1.9024576187133788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,2.5094272613525392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,3.024799919128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,4.285811233520508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,5.887519836425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,1,power_law_1.2,7.235116577148437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,1,power_law_1.2,10.738304138183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,1,power_law_1.2,0.1059008002281189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,1,power_law_1.2,0.10640640258789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,1,power_law_1.2,21.27183380126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,1,power_law_1.2,0.15158400535583497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,balanced,0.10963732997576396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,1,power_law_1.2,0.20904960632324218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,balanced,0.15200000007947287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,1,power_law_1.2,0.2737407922744751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,balanced,0.2643306652704875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,1,power_law_1.2,0.5257472038269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,balanced,0.49114131927490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,1,power_law_1.2,0.5632768154144288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,balanced,49.28059387207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,balanced,0.9505013624827067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,1,power_law_1.2,0.5975872039794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,balanced,1.8510986963907878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,1,power_law_1.2,0.6254144191741944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,1,power_law_1.2,0.6756415843963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,balanced,2.7519359588623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,1,power_law_1.2,0.7102015972137451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,balanced,2.7548373540242515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,1,power_law_1.2,0.7501760005950928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,balanced,2.752511978149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,1,power_law_1.2,0.7948544025421143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,balanced,2.7707732518514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,1,power_law_1.2,0.8595840454101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,balanced,2.775146802266439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,1,power_law_1.2,0.9480768203735351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,balanced,2.783546765645345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,balanced,2.7877120971679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,balanced,2.801018714904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,1,power_law_1.2,0.9477952003479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,balanced,2.824735959370931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,balanced,2.831088066101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,1,power_law_1.2,1.0304896354675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,balanced,2.798522631327311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,balanced,2.8356641133626304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,1,power_law_1.2,1.1677760124206542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,balanced,2.9285761515299478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.2,1.3317888259887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,balanced,3.021930694580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.2,1.5902912139892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.2,1.9426240921020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,balanced,3.0694348017374673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,balanced,0.07704000174999237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.2,2.605254364013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,balanced,0.10051733255386353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,balanced,3.2011467615763345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.2,3.288294219970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,balanced,0.15954132874806723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,balanced,0.27561599016189575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.2,4.646950531005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,balanced,0.5030133326848348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,balanced,0.9596746762593588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,balanced,3.388586680094401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.2,6.033337783813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,balanced,1.4029547373453777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,balanced,1.4186347325642903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.2,8.775385284423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,balanced,1.4120853741963704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,balanced,1.416053295135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.2,11.466316986083985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,balanced,3.553173383076986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,balanced,1.4257920583089192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,balanced,1.4317439397176106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,balanced,1.433824062347412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.2,14.260986328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,balanced,1.443903923034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,balanced,1.4686773618062336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,balanced,3.854074796040853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,balanced,1.4737866719563801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,1,power_law_1.2,22.675526428222657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,balanced,1.4950453440348308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,balanced,1.53219207127889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,balanced,1.5619893074035645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,1,power_law_1.2,45.39567260742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,balanced,1.6331040064493816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,balanced,4.247658729553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,balanced,1.6801439921061199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,balanced,1.7895572980244954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,balanced,0.08931733171145122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,balanced,1.9064586957295735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.01,0.2736191987991333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,balanced,0.10969600081443787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.17863039970397948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,balanced,0.17385600010553995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.01,0.5071936130523682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,balanced,5.795509338378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.01,0.2673151969909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.01,0.9699904441833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,balanced,0.30561065673828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,balanced,2.125498612721761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.01,0.38673279285430906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,balanced,0.49906667073567706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.01,0.49750399589538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,balanced,0.9424426555633545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.01,0.7411712169647217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.01,0.20974719524383545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,balanced,1.3853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.01,1.175487995147705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.01,0.3651711940765381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.01,1.3257023811340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,balanced,1.388330618540446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,balanced,2.434826691945394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.01,1.90882568359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.01,0.5788415908813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,balanced,1.393162727355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.01,1.8948223114013671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,balanced,1.3976319630940754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.01,0.6714623928070068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.01,2.0303359985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,balanced,1.4045546849568684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.01,0.9172927856445312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.01,2.0834239959716796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,balanced,1.4132906595865886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.01,1.0027711868286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.01,2.1186496734619142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,balanced,9.529114405314127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,balanced,1.4224692980448406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.01,1.0040575981140136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.01,2.23374080657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,balanced,2.828746795654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,balanced,1.4367359479268391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.01,2.4840383529663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.01,1.0143487930297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,balanced,1.45469331741333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.01,2.612985610961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.01,1.0828479766845702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,balanced,1.4690666198730469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.01,2.7666431427001954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.01,1.139628791809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,balanced,1.49401060740153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.01,2.3596351623535154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.01,1.1760000228881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.01,2.6386112213134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,balanced,1.5511573155721028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.01,1.2035072326660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.01,3.065407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.01,1.2630911827087403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,balanced,3.699514706929525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.01,3.758047866821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.01,1.2507904052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.01,3.6241600036621096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.01,1.459449577331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,1.5432000160217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.01,4.414771270751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,balanced,1.6131253242492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,1.797216033935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.01,4.199660873413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,power_law_1.01,0.1977023959159851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,1.7162303924560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,balanced,9.960330963134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.01,5.103782272338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,power_law_1.01,0.2910271883010864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,2.118764877319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,power_law_1.01,0.5127295970916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.01,5.22215690612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,2.269811248779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,power_law_1.01,0.21875200271606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,balanced,4.6913760503133135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,4,power_law_1.2,0.29381120204925537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,power_law_1.01,0.39255681037902834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.01,6.586732482910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,2.7923391342163084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,power_law_1.01,0.610310411453247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,balanced,1.738928000132243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,4,power_law_1.2,0.48935680389404296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,3.1416704177856447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.01,8.56118392944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,power_law_1.01,0.7358528137207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,4,power_law_1.2,0.509887981414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,balanced,1.8496373494466145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,power_law_1.01,0.9083711624145507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,3.7830974578857424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,4,power_law_1.2,0.36475520133972167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.01,10.191091156005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,power_law_1.01,0.9721088409423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,4.855980682373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,power_law_1.01,1.0295616149902345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,4,power_law_1.2,0.7232895851135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,balanced,2.046501318613688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,power_law_1.01,1.082380771636963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,4,power_law_1.2,1.0578944206237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.01,13.59393310546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,power_law_1.01,1.117420768737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.01,5.960332870483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,4,power_law_1.2,1.2748800277709962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,balanced,2.2683626810709634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,power_law_1.01,1.1259008407592774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,4,power_law_1.2,1.6640447616577148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,power_law_1.01,1.2241408348083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.01,8.454329681396484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.01,31.123635864257814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,4,power_law_1.2,1.7534208297729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,power_law_1.01,1.3144831657409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,4,power_law_1.2,1.8271295547485351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,balanced,2.6521760622660318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,power_law_1.01,1.4094528198242187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,4,power_law_1.2,1.9869312286376952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.01,15.757626342773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,power_law_1.01,1.5637248039245606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,balanced,6.792405446370442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,4,power_law_1.2,2.1142976760864256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,power_law_1.01,1.824844741821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,4,power_law_1.2,2.173401641845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,balanced,3.6859680811564126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,4,power_law_1.2,2.295852851867676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.01,1.7578176498413085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,4,power_law_1.2,2.5455039978027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,4,power_law_1.2,2.658367919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,4,power_law_1.2,2.4158016204833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.01,1.7882879257202149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,balanced,4.579514821370442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,4,power_law_1.2,2.712895965576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.01,1.9979839324951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,balanced,19.189706166585285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,4,power_law_1.2,3.315756988525391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.01,2.5449024200439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.01,2.608678436279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,4,power_law_1.2,3.852588653564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.01,3.5289215087890624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,4,power_law_1.2,3.814374542236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.01,4.261433410644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,4,power_law_1.2,4.802137756347657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.01,5.922208023071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,balanced,6.447423934936523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,4,power_law_1.2,4.132467269897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.01,7.959942626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,4,power_law_1.2,5.1929473876953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,power_law_1.01,9.817183685302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,4,power_law_1.2,5.322444915771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,power_law_1.01,15.802720642089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,4,power_law_1.2,7.334989166259765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.17699840068817138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,4,power_law_1.2,10.379007720947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,4,power_law_1.2,0.26800639629364015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,power_law_1.01,31.22342529296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,balanced,8.800064086914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,4,power_law_1.2,0.26127359867095945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,balanced,13.386292775472006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,4,power_law_1.2,11.716460418701171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,4,power_law_1.2,0.23359360694885253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,4,power_law_1.2,0.3949376106262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,4,power_law_1.2,14.507066345214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,4,power_law_1.2,0.5421504020690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,4,power_law_1.2,0.6316991806030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,4,power_law_1.2,0.843718433380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,4,power_law_1.2,32.70309143066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,4,power_law_1.2,0.9317376136779785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,4,power_law_1.2,1.0095040321350097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,4,power_law_1.2,0.9784064292907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,4,power_law_1.2,1.0214079856872558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,4,power_law_1.2,1.0736512184143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,4,power_law_1.2,1.156383991241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,balanced,13.344304402669271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,4,power_law_1.2,1.2134400367736817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,4,power_law_1.2,1.293280029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,4,power_law_1.2,1.3522047996520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,4,power_law_1.2,1.4836544036865233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,1.6332096099853515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,1.93450870513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,1.8231679916381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,2.2093055725097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,2.469785690307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,3.125779151916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,3.240153503417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,4.239782333374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,5.277337646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,4,power_law_1.2,6.430847930908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,4,power_law_1.2,9.190271759033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,4,power_law_1.2,17.328250122070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,balanced,26.961878458658855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,balanced,0.11001599828402202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,balanced,0.1550826629002889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,balanced,0.2738879919052124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,balanced,0.5013333161671957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,4,power_law_1.2,0.1812608003616333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,balanced,0.988858699798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,balanced,1.8839786847432454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,4,power_law_1.2,0.2919935941696167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,4,power_law_1.2,0.24643199443817138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,balanced,2.787743886311849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,4,power_law_1.2,0.22161920070648194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,balanced,2.8864161173502603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,4,power_law_1.2,0.3997247934341431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,balanced,2.8768908182779946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,4,power_law_1.2,0.531660795211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,balanced,2.880138715108236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,4,power_law_1.2,0.5764095783233643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,balanced,0.07830933233102162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,4,power_law_1.2,0.826144027709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,balanced,2.8902133305867515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,balanced,0.10142399867375691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,4,power_law_1.2,0.9394559860229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,balanced,2.8941386540730796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,balanced,0.15762133399645487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,4,power_law_1.2,0.973363208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,balanced,2.9138879776000977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,balanced,0.27634666363398236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,4,power_law_1.2,1.0319487571716308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,balanced,0.5055253505706787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,balanced,2.843834559122721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,4,power_law_1.2,1.1511103630065918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,balanced,0.9710666338602701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,4,power_law_1.2,1.1600959777832032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,balanced,2.8645493189493814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,balanced,1.421514670054118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,balanced,1.4361440340677898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,4,power_law_1.2,1.207596778869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,balanced,2.8874667485555015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,balanced,1.4401119550069172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,4,power_law_1.2,1.3697471618652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,balanced,2.912106513977051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,balanced,1.4414186477661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,4,power_law_1.2,1.383020782470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,balanced,1.460330645243327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,4,power_law_1.2,1.598630428314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,balanced,2.956970532735189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,balanced,1.4587999979654949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,4,power_law_1.2,1.8608768463134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,balanced,1.4751520156860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,balanced,3.107189178466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,balanced,1.4778772989908855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,balanced,1.4975093205769856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,balanced,3.227663993835449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.2,1.82544002532959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,balanced,1.5121547381083171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,balanced,1.5494453112284343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,balanced,3.2647199630737305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.2,1.8605056762695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,balanced,1.5906079610188801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.2,2.121446418762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,balanced,3.441322644551595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,balanced,1.618831952412923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.2,2.716166305541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,balanced,1.6964213053385417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.2,2.894758415222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,balanced,3.6781333287556968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.01,0.1753983974456787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,balanced,1.783573309580485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.01,0.10987520217895508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.2,3.6986175537109376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.01,0.26525440216064455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.01,0.15693440437316894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.2,4.680710220336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.01,0.49407358169555665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,balanced,1.9487412770589192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.01,0.27092480659484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,balanced,4.0150346755981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.01,0.3563199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.2,7.306476593017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.01,0.21354238986968993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.01,0.6818175792694092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.01,0.39384961128234863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,balanced,2.0978506406148276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.01,1.1079423904418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.2,8.927724456787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.01,0.5974016189575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.01,1.2577792167663575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,balanced,0.11284266908963521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.01,0.6881343841552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,balanced,4.362842559814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,4,power_law_1.2,10.50780792236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.01,1.681760025024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,balanced,0.12959999839464822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.01,0.9049087524414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,balanced,2.4311307271321616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.01,1.8870527267456054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,balanced,0.19828800360361734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.01,0.9582207679748536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.01,1.843212890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,balanced,0.3322719931602478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,4,power_law_1.2,15.669471740722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,balanced,0.5170720020929972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.01,2.066655921936035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.01,0.9828864097595215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,balanced,0.9598026275634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.01,2.119712066650391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,balanced,1.4059093793233235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.01,1.0809599876403808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,balanced,2.8906561533610025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,balanced,1.4114294052124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.01,2.1856639862060545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,balanced,4.975354512532552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.01,1.0759807586669923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,4,power_law_1.2,36.550112915039065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,balanced,1.4185546239217122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.01,2.1727807998657225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,balanced,1.425872008005778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.01,1.1379199981689454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.01,2.2239999771118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,balanced,1.4376907348632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.01,1.1935359954833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.01,2.273523139953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,balanced,1.450032075246175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.01,1.276313591003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,balanced,1.462831974029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.01,2.3832447052001955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.01,1.3324864387512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,balanced,1.481514612833659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,balanced,3.502448081970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.01,2.488256072998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,balanced,1.5080533027648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.01,1.2947839736938476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.01,2.9061504364013673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,balanced,6.15943972269694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,balanced,1.5282185872395833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.01,1.4172415733337402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.01,3.168492889404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,balanced,1.582032044728597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.01,1.5784895896911622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.01,3.487315368652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.01,1.845952033996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,balanced,1.6790560086568196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.01,1.7563264846801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.01,4.450681686401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.01,2.0910720825195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.01,3.966169738769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,balanced,4.644879976908366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.01,2.184716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.01,4.621952056884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.01,2.6525312423706056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.01,5.152127838134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,balanced,1.761573314666748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.01,3.3346622467041014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,balanced,8.039386749267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.01,6.473900604248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.01,4.340339279174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.01,7.7937980651855465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.01,5.862355041503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.01,9.448966217041015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.01,7.011622619628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,balanced,6.740746815999349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.01,13.383021545410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,2,power_law_1.2,0.1764032006263733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.01,8.89660186767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,balanced,1.9646239280700684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,2,power_law_1.2,0.2655488014221191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,power_law_1.01,0.14120960235595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,2,power_law_1.2,0.2643712043762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,balanced,2.1249759991963706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,power_law_1.01,0.2009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,2,power_law_1.2,0.3597248077392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.01,31.017837524414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.01,19.401593017578126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,2,power_law_1.2,0.6655231952667237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,power_law_1.01,0.31184000968933107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,balanced,2.4550719261169434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,power_law_1.01,0.22371840476989746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,2,power_law_1.2,0.9724160194396972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,2,power_law_1.2,1.1563136100769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,power_law_1.01,0.42152957916259765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,balanced,2.859386761983236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,2,power_law_1.2,1.6623231887817382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,balanced,12.404309590657553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,power_law_1.01,0.6054719924926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,2,power_law_1.2,1.7648191452026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,2,power_law_1.2,1.8043903350830077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,power_law_1.01,0.6825664043426514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,2,power_law_1.2,1.9179136276245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,balanced,3.498965263366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,power_law_1.01,0.9230719566345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,2,power_law_1.2,2.05100154876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,power_law_1.01,0.9672896385192871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,balanced,8.160373051961264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,2,power_law_1.2,2.138483238220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,power_law_1.01,0.9805952072143554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,2,power_law_1.2,2.122336006164551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,power_law_1.01,1.0528512001037598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,balanced,5.12718931833903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,2,power_law_1.2,2.2180479049682615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,power_law_1.01,1.0996352195739747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,2,power_law_1.2,2.225324821472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,power_law_1.01,1.1485887527465821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,2,power_law_1.2,2.4446592330932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,power_law_1.01,1.230784034729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,2,power_law_1.2,2.6321407318115235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,power_law_1.01,1.3390463829040526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,2,power_law_1.2,3.083263969421387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,power_law_1.01,1.3750656127929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,2,power_law_1.2,3.4564414978027345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,balanced,6.623717625935872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,2,power_law_1.2,3.812486267089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,power_law_1.01,1.5531200408935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,2,power_law_1.2,4.588588714599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,power_law_1.01,1.8275455474853515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,2,power_law_1.2,4.175148773193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,2,power_law_1.2,5.099039840698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,power_law_1.01,1.8415872573852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,2,power_law_1.2,5.835961532592774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,2,power_law_1.2,6.769862365722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,balanced,9.008821487426758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,power_law_1.01,1.9767936706542968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,2,power_law_1.2,9.349568176269532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,power_law_1.01,2.2371776580810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,2,power_law_1.2,11.146675109863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,power_law_1.01,2.8247552871704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,power_law_1.01,3.1627519607543944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,2,power_law_1.2,14.264390563964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,power_law_1.01,4.282867050170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,balanced,22.186452229817707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,power_law_1.01,5.2497600555419925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,2,power_law_1.2,31.126641845703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,power_law_1.01,7.07080307006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,balanced,11.889354705810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,balanced,15.736309051513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,power_law_1.01,9.606150054931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,power_law_1.01,12.096749114990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,power_law_1.01,18.193209838867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,power_law_1.01,35.204531860351565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,2,power_law_1.2,0.0997439980506897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,2,power_law_1.2,0.15802240371704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,2,power_law_1.2,0.1670912027359009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,balanced,18.12707773844401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,2,power_law_1.2,0.2025279998779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,2,power_law_1.2,0.37201919555664065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,2,power_law_1.2,0.4847424030303955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,2,power_law_1.2,0.6127808094024658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,2,power_law_1.2,0.9013055801391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,2,power_law_1.2,0.8853376388549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,2,power_law_1.2,0.9572863578796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,2,power_law_1.2,0.9861568450927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,2,power_law_1.2,1.1154751777648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,2,power_law_1.2,1.1111040115356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,2,power_law_1.2,1.2344960212707519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,2,power_law_1.2,1.2941184043884277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,2,power_law_1.2,1.3219200134277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,2,power_law_1.2,1.313920021057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,2,power_law_1.2,1.4236031532287599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,2,power_law_1.2,1.5865983963012695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,2,power_law_1.2,1.9526399612426757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,2,power_law_1.2,1.915705680847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,2,power_law_1.2,2.258835220336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,2,power_law_1.2,2.33819522857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,2,power_law_1.2,2.8040128707885743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,2,power_law_1.2,3.551212692260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,balanced,0.11433066924413045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,2,power_law_1.2,4.583078384399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,balanced,0.15610667069753012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,balanced,36.32239023844401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,balanced,0.26818132400512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,2,power_law_1.2,5.877536010742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,balanced,0.5078346729278564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,2,power_law_1.2,0.1413375973701477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,balanced,0.9768479665120443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,2,power_law_1.2,6.754246520996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,2,power_law_1.2,0.19986560344696044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,balanced,1.8731199900309246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,2,power_law_1.2,0.2050368070602417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,2,power_law_1.2,9.3910400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,balanced,2.7863146464029946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,2,power_law_1.2,0.22938239574432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,balanced,2.811375935872396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,2,power_law_1.2,0.36570239067077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,2,power_law_1.2,19.61261444091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,balanced,2.8249972661336265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,2,power_law_1.2,0.526854419708252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,balanced,2.8203681310017905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,2,power_law_1.2,0.6052480220794678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,balanced,2.8236265182495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,2,power_law_1.2,0.8667712211608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,balanced,2.840357462565104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,2,power_law_1.2,0.911308765411377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,balanced,2.8542613983154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,2,power_law_1.2,0.9404288291931152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,balanced,2.8180532455444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,2,power_law_1.2,1.0428095817565919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,balanced,2.8394241333007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,2,power_law_1.2,1.0737088203430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,balanced,2.8499892552693686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,2,power_law_1.2,1.1559871673583983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,balanced,2.8823413848876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,2,power_law_1.2,1.2545984268188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,balanced,2.9534133275349936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,2,power_law_1.2,1.3121983528137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,2,power_law_1.2,1.415827178955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,balanced,3.1380640665690103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,2,power_law_1.2,1.571513557434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,balanced,3.2741225560506186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,2,power_law_1.2,1.849625587463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,balanced,3.4658454259236655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,2,power_law_1.2,1.9757440567016602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,balanced,0.08109333117802937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,balanced,3.783386548360189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,balanced,0.10399466753005981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,balanced,0.16210666298866272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,2,power_law_1.2,2.020844841003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,balanced,0.28735466798146564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,balanced,0.5277013381322225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,balanced,4.077349344889323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,2,power_law_1.2,2.292140769958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,balanced,1.006160020828247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,balanced,1.492970625559489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,2,power_law_1.2,2.926796722412109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,balanced,1.4779253005981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,balanced,1.4970614115397136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,2,power_law_1.2,3.297843170166016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,balanced,1.501962661743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,balanced,4.662970542907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,2,power_law_1.2,4.372864151000977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.10401279926300049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,balanced,0.16791999340057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,balanced,1.5185333887736003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,balanced,1.5271627108256023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.15649919509887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,balanced,0.18183465798695883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,2,power_law_1.2,5.449900817871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,balanced,1.5470666885375977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.26742401123046877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,balanced,0.23905599117279053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,balanced,1.5379360516866047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,2,power_law_1.2,7.374329376220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.3586816072463989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,balanced,0.34849599997202557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,balanced,5.262277285257976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,balanced,1.5659786860148113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,balanced,0.5509653488794962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.7026495933532715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,2,power_law_1.2,9.943641662597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,balanced,1.5714027086893718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,balanced,1.025157372156779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.01,1.0948863983154298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,balanced,1.613925298055013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,balanced,1.491685390472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.0800383985042572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,2,power_law_1.2,11.86028823852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,balanced,1.5038080215454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.01,1.3096896171569825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,balanced,1.6838560104370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.10259840488433838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,balanced,1.5142453511555989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.01,1.6982976913452148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,balanced,1.7411413192749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.15964159965515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,balanced,1.5259307225545247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,2,power_law_1.2,18.773414611816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,balanced,6.7729066212972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.01,1.8023296356201173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,balanced,1.5391359329223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.01,0.19546879529953004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,balanced,1.8906292915344238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,balanced,1.5632266998291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.01,1.8581632614135741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.01,0.3903104066848755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,balanced,1.5781973203023274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.01,1.9985279083251952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,balanced,2.07040007909139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.01,0.584012794494629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,balanced,1.6204746564229329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,2,power_law_1.2,36.5384521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.01,2.062067222595215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.01,0.6923711776733399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,balanced,1.6676747004191081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,balanced,2.3393227259318032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,balanced,1.7005653381347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.01,0.8761024475097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.01,2.14398078918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,balanced,1.7777066230773926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.01,0.9489983558654785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.01,2.1956096649169923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,balanced,1.9371466636657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,balanced,7.948752085367839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,balanced,2.559285322825114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.01,0.9783743858337403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.01,2.243596839904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.01,1.0339200019836425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.01,2.3193471908569334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.01,1.109830379486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,balanced,3.1047840118408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.01,2.440550422668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,balanced,2.100933392842611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.01,1.1300031661987304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.01,2.6299327850341796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.01,1.177030372619629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.01,2.766764831542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,balanced,3.750218709309896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.01,1.2383423805236817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.01,3.1675136566162108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.01,1.2852736473083497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.01,3.7143489837646486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,balanced,10.690799713134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.01,1.3475135803222655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.01,4.380716705322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,balanced,2.4792799949645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.01,1.5396544456481933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.01,4.0784446716308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,1.6397632598876952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,balanced,2.807450612386068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,balanced,5.131807963053386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.01,4.586073684692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,1.9798208236694337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,balanced,3.3954079945882163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.01,5.561651229858398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,2.0362688064575196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,2.449504089355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.01,7.226105499267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,2.4792448043823243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,balanced,4.0999094645182295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.01,10.378201293945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,3.0893056869506834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,3.7921985626220702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,balanced,5.8707841237386065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.01,12.37418212890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,balanced,5.343221028645833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,5.037184143066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.01,15.423443603515626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,6.442233276367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,balanced,14.77450180053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.01,7.655910491943359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,balanced,7.517391840616862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.01,33.021234130859376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.01,11.209523010253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,balanced,7.553322474161784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,power_law_1.01,0.1643455982208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.01,24.815078735351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,power_law_1.01,0.1902143955230713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,balanced,10.043733596801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,power_law_1.01,0.2489151954650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,power_law_1.01,0.2667072057723999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,power_law_1.01,0.42658557891845705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.1129472017288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,power_law_1.01,0.606873607635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.15665279626846312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.21150081157684325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,power_law_1.01,0.7258431911468506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.3315520048141479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,power_law_1.01,0.9749823570251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.6311295986175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,balanced,13.580980936686197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.9401599884033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,power_law_1.01,1.0056575775146483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,1,power_law_1.2,1.1002047538757325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,power_law_1.01,1.062342357635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,balanced,11.288992563883463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,1,power_law_1.2,1.6365184783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,power_law_1.01,1.1151040077209473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,1,power_law_1.2,1.7254720687866212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,power_law_1.01,1.1673151969909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,1,power_law_1.2,1.7940927505493165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,power_law_1.01,1.2226048469543458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,1,power_law_1.2,1.9105663299560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,power_law_1.01,1.3080960273742677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,1,power_law_1.2,2.0292863845825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,power_law_1.01,1.4246463775634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,1,power_law_1.2,2.0513792037963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,power_law_1.01,1.5392448425292968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,1,power_law_1.2,2.151238441467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,balanced,17.017920176188152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,power_law_1.01,1.6864191055297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,1,power_law_1.2,2.2242368698120116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,power_law_1.01,1.9995967864990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,1,power_law_1.2,2.293222427368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,balanced,28.49590301513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,1,power_law_1.2,2.4639232635498045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,1,power_law_1.2,2.759359931945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.01,2.0364160537719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,1,power_law_1.2,2.9473024368286134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,1,power_law_1.2,3.3288192749023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,1,power_law_1.2,3.84192008972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.01,2.3870399475097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,1,power_law_1.2,4.647635269165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.01,2.7944255828857423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,1,power_law_1.2,4.339558410644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.01,3.6759166717529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,1,power_law_1.2,5.14563217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.01,4.210323333740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,1,power_law_1.2,5.874732971191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.01,5.642822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,1,power_law_1.2,7.697408294677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,balanced,27.00707753499349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,1,power_law_1.2,10.796428680419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.01,7.15836181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.01,10.225791931152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,1,power_law_1.2,12.713689422607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,balanced,24.15057627360026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,1,power_law_1.2,15.685638427734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.01,13.401727294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.01,16.34471740722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.07991039752960205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,1,power_law_1.2,31.716433715820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.10209280252456665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,power_law_1.01,25.931231689453124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.1259392023086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,1,power_law_1.2,0.19752960205078124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,1,power_law_1.2,0.3429696083068848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,1,power_law_1.2,0.4997119903564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,power_law_1.01,50.976287841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,1,power_law_1.2,0.6168767929077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,1,power_law_1.2,0.8434559822082519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,1,power_law_1.2,0.9213503837585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,1,power_law_1.2,0.9555264472961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,1,power_law_1.2,1.013535976409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,1,power_law_1.2,1.0963135719299317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,1,power_law_1.2,1.1122112274169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,1,power_law_1.2,1.187443161010742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,1,power_law_1.2,1.2522560119628907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,1,power_law_1.2,1.3150079727172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,balanced,53.48247782389323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,1,power_law_1.2,1.4108287811279296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,1,power_law_1.2,1.615648078918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,1.7062271118164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,1.9984384536743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,balanced,0.059152002135912575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,2.155513572692871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,balanced,0.07358933488527934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,balanced,0.08264000217119853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,2.545587158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,balanced,0.0881226658821106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,balanced,0.12626133362452188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,2.598355293273926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,balanced,0.1943946679433187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,3.2030529022216796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,balanced,0.19595199823379517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,1,power_law_1.2,0.1577023983001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,balanced,0.1976213256518046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,3.9688705444335937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,1,power_law_1.2,0.19005440473556517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,balanced,0.1977120041847229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,5.294400024414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,balanced,0.19824000199635824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,1,power_law_1.2,0.2209088087081909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,balanced,0.19940799474716187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,1,power_law_1.2,0.26985599994659426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,6.561331176757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,balanced,0.21304533878962198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,1,power_law_1.2,0.38531200885772704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,balanced,0.21330666542053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,1,power_law_1.2,7.796550750732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,1,power_law_1.2,0.5355711936950683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,balanced,0.2142826716105143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,1,power_law_1.2,0.6346752166748046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,balanced,0.27028266588846844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,1,power_law_1.2,11.33201904296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,power_law_1.01,0.10474239587783814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,1,power_law_1.2,0.909727954864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,balanced,0.27137066920598346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,power_law_1.01,0.13541120290756226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,1,power_law_1.2,0.9596223831176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,balanced,0.2702346642812093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,power_law_1.01,0.09735680222511292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,balanced,0.5460373163223267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,1,power_law_1.2,0.9829695701599122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,1,power_law_1.2,24.295391845703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,power_law_1.01,0.09342719912528992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,balanced,0.5496053298314413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,1,power_law_1.2,1.089907169342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,power_law_1.01,0.11902079582214356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,balanced,0.5538133382797241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,power_law_1.01,0.12932480573654176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,1,power_law_1.2,1.18090877532959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,power_law_1.01,0.1536960005760193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,1,power_law_1.2,1.207852840423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,balanced,0.5617546637852987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,power_law_1.01,0.17503360509872437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,1,power_law_1.2,1.326483154296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,power_law_1.01,0.1662976026535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,balanced,0.5812480052312216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,1,power_law_1.2,1.4446208000183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,power_law_1.01,0.18876800537109376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,power_law_1.01,0.18272639513015748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,1,power_law_1.2,1.5343551635742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,balanced,0.6058239936828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,power_law_1.01,0.19546879529953004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,1,power_law_1.2,1.72412166595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,power_law_1.01,0.19003520011901856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,balanced,1.118016004562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,1,power_law_1.2,2.0574079513549806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,power_law_1.01,0.1965567946434021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,power_law_1.01,0.26618878841400145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,power_law_1.01,0.27929599285125734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,balanced,1.1607306798299153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,power_law_1.01,0.29052159786224363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.2,2.0921472549438476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,power_law_1.01,0.5581183910369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,power_law_1.01,0.598796796798706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,power_law_1.01,0.6672512054443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.2,2.460198402404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,balanced,1.719578742980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,power_law_1.01,0.7438975811004639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.2,2.9024127960205077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,power_law_1.01,0.9437952041625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.2,3.7481407165527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,power_law_1.01,1.1434432029724122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,4,power_law_1.2,0.10613119602203369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,balanced,2.2732747395833335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.2,4.322227096557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,balanced,0.05835733314355215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,power_law_1.01,1.4779583930969238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,4,power_law_1.2,0.12965760231018067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,power_law_1.01,1.6955839157104493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,4,power_law_1.2,0.091839998960495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.2,5.781907272338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,balanced,0.06282666822274525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,power_law_1.01,2.5345535278320312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,4,power_law_1.2,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.2,7.331084442138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,4,power_law_1.2,0.10384639501571655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,power_law_1.01,3.4161983489990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,balanced,2.855221430460612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,power_law_1.01,0.07306240200996399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,4,power_law_1.2,0.12445440292358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.2,10.408217620849609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,power_law_1.01,4.1175487518310545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,balanced,0.08710933725039165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,4,power_law_1.2,0.14162559509277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,power_law_1.01,0.09105280041694641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,balanced,0.09921600421269734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,power_law_1.01,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,power_law_1.01,6.328179168701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,4,power_law_1.2,0.16503039598464966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.2,13.367788696289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,power_law_1.01,0.09079679846763611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,balanced,0.12409067153930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,4,power_law_1.2,0.1677248001098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,power_law_1.01,0.09985920190811157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,balanced,0.1962933341662089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,power_law_1.01,12.081964874267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,4,power_law_1.2,0.16906239986419677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,power_law_1.01,0.12054400444030762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,balanced,0.19735467433929443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.2,16.373036193847657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,power_law_1.01,0.14923520088195802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,4,power_law_1.2,0.16874879598617554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,balanced,0.19985065857569376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,power_law_1.01,0.16745599508285522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,balanced,4.4928693771362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,4,power_law_1.2,0.18135039806365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,balanced,0.1996906598409017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,power_law_1.01,0.17556480169296265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,1,power_law_1.2,25.862149047851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,power_law_1.01,0.17371519804000854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,4,power_law_1.2,0.1887935996055603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,balanced,0.2007466753323873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,power_law_1.01,0.1781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,balanced,0.20195200045903525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,4,power_law_1.2,0.20273280143737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,power_law_1.01,0.17777279615402222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,balanced,0.2034026583035787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,4,power_law_1.2,0.296287989616394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,power_law_1.01,0.19333759546279908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,balanced,0.20371200640996298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,power_law_1.01,0.2147007942199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,4,power_law_1.2,0.3186431884765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,1,power_law_1.2,50.891668701171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,balanced,0.20522665977478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,power_law_1.01,0.22488958835601808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,4,power_law_1.2,0.3329087972640991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,2,power_law_1.2,0.07340800166130065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,power_law_1.01,0.22304000854492187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,balanced,0.22054932514826456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,4,power_law_1.2,0.6216127872467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,power_law_1.01,0.2510463953018188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,2,power_law_1.2,0.09068800210952759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,balanced,0.2233440081278483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,power_law_1.01,0.33968639373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,4,power_law_1.2,0.6304128170013428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,2,power_law_1.2,0.08050559759140015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,balanced,0.22595200935999551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,power_law_1.01,0.36784000396728517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,2,power_law_1.2,0.09618560075759888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,4,power_law_1.2,0.7932672023773193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,balanced,0.2871146599451701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,power_law_1.01,0.6792704105377197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,2,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,4,power_law_1.2,0.8288767814636231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,balanced,0.2906559904416402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,power_law_1.01,0.7716095924377442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,2,power_law_1.2,0.11431679725646973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,balanced,8.896421432495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,4,power_law_1.2,1.0242879867553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,power_law_1.01,0.9079999923706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,balanced,0.5898240009943644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,2,power_law_1.2,0.14960000514984131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,4,power_law_1.2,1.1982784271240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,power_law_1.01,1.0797823905944823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,2,power_law_1.2,0.15084160566329957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,balanced,0.600325345993042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,4,power_law_1.2,1.6180992126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,power_law_1.01,1.4287039756774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,2,power_law_1.2,0.16243840456008912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,balanced,0.6202720006306967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,4,power_law_1.2,2.0452415466308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,power_law_1.01,1.6308095932006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,2,power_law_1.2,0.17107839584350587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,2,power_law_1.2,0.17912960052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,4,power_law_1.2,2.846918487548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,power_law_1.01,2.4288063049316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,balanced,0.6459840138753256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,2,power_law_1.2,0.19230719804763793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,4,power_law_1.2,3.6204608917236327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,power_law_1.01,3.1587711334228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,2,power_law_1.2,0.1980288028717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,2,power_law_1.2,0.21635839939117432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,balanced,1.192032019297282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,4,power_law_1.2,4.857017517089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,power_law_1.01,3.6522495269775392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,2,power_law_1.2,0.22112638950347902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,2,power_law_1.2,0.23331840038299562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,power_law_1.01,6.107942581176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,4,power_law_1.2,7.850777435302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,2,power_law_1.2,0.2691263914108276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,balanced,1.2351946830749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,2,power_law_1.2,0.3515712022781372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,power_law_1.01,11.507596588134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,4,power_law_1.2,14.063833618164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,2,power_law_1.2,0.3960383892059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,2,power_law_1.2,0.738431978225708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,balanced,1.8292427062988281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,2,power_law_1.2,0.8627455711364747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,2,power_law_1.2,0.9560576438903808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,2,power_law_1.2,1.106067180633545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,balanced,2.4398880004882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,2,power_law_1.2,1.5237312316894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,2,power_law_1.2,1.7397951126098632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,2,power_law_1.2,2.477907180786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,balanced,0.032960000137488045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,2,power_law_1.2,3.1760639190673827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,balanced,0.04046933352947235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,balanced,3.0186986923217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,2,power_law_1.2,4.002387237548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,balanced,0.05604266623655955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,balanced,0.08853333195050557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,power_law_1.2,6.196480178833008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,balanced,0.12139200170834859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,power_law_1.2,11.616684722900391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,balanced,0.1951520045598348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,balanced,0.19563732544581094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,2,balanced,4.820650736490886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,balanced,0.19497599204381308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,balanced,0.19685333967208862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,balanced,0.19704532623291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,balanced,0.19799466927846274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,balanced,0.19897600015004477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,balanced,0.20016533136367798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,balanced,0.20336532592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,balanced,0.20496533314387003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,balanced,0.20773333311080933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,balanced,0.2116053303082784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,balanced,0.23558932542800903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,balanced,0.2437546650568644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,2,balanced,9.529808044433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,balanced,0.317413330078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,balanced,0.33210132519404095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,balanced,0.6535413265228271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,balanced,0.6837866306304932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,power_law_1.01,0.032601600885391234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,balanced,1.248949368794759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,power_law_1.01,0.040838399529457094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,power_law_1.01,0.046963199973106384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,balanced,1.312618652979533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,power_law_1.01,0.0775871992111206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,power_law_1.01,0.09327999949455261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,1,power_law_1.2,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,power_law_1.01,0.11441279649734497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,balanced,1.9271732966105144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,1,power_law_1.2,0.04097279906272888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,power_law_1.01,0.14507520198822021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,1,power_law_1.2,0.048895999789237976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,power_law_1.01,0.15211520195007325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,1,power_law_1.2,0.06871039867401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,power_law_1.01,0.16042879819869996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,1,power_law_1.2,0.08627200126647949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,power_law_1.01,0.1697983980178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,balanced,2.5490399996439614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,1,power_law_1.2,0.10670720338821411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,power_law_1.01,0.17223039865493775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,1,power_law_1.2,0.14349440336227418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,power_law_1.01,0.17500799894332886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,1,power_law_1.2,0.154310405254364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,power_law_1.01,0.1804352045059204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,1,power_law_1.2,0.15763200521469117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,power_law_1.01,0.19928959608078003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,balanced,3.188906669616699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,1,power_law_1.2,0.16370559930801393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,power_law_1.01,0.22224640846252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,1,power_law_1.2,0.1671872019767761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,power_law_1.01,0.2371135950088501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,1,power_law_1.2,0.18151040077209474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,power_law_1.01,0.26876800060272216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,1,power_law_1.2,0.18873599767684937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,power_law_1.01,0.29381120204925537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,power_law_1.01,0.34075520038604734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,1,power_law_1.2,0.2034303903579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,balanced,0.058261334896087646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,1,power_law_1.2,0.2279871940612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,power_law_1.01,0.43831682205200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,1,power_law_1.2,0.24049921035766603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,power_law_1.01,0.4934207916259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,balanced,5.061066627502441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,1,power_law_1.2,0.28575360774993896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,balanced,0.07123733560244243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,power_law_1.01,0.9273407936096192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,1,power_law_1.2,0.3020992040634155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,power_law_1.01,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,power_law_1.01,1.0797951698303223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,4,power_law_1.2,0.09178879857063293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,1,power_law_1.2,0.34798080921173097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,balanced,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,power_law_1.01,1.385478401184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,power_law_1.2,0.08546559810638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,4,power_law_1.01,0.08727679848670959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,1,power_law_1.2,0.4505023956298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,power_law_1.2,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,power_law_1.01,1.6891584396362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,4,power_law_1.01,0.09321600198745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,1,power_law_1.2,0.5241856098175048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,power_law_1.01,2.2849727630615235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,1,power_law_1.2,0.9572223663330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,balanced,0.07717866698900859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,power_law_1.01,0.07365760207176208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,1,power_law_1.2,1.1254015922546388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,power_law_1.01,2.9306751251220704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,4,power_law_1.2,0.07781760096549988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,1,power_law_1.2,1.419603157043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,power_law_1.01,3.5417728424072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,1,power_law_1.2,1.7254592895507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,balanced,0.07589333256085713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,power_law_1.01,5.421836853027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,power_law_1.01,0.07529600262641907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,4,power_law_1.2,0.07436800003051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,1,power_law_1.2,2.3604736328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,balanced,0.0830080012480418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,power_law_1.01,0.08183040022850037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,4,power_law_1.2,0.08363519906997681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,power_law_1.01,10.294707489013671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,1,power_law_1.2,2.9363712310791015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,balanced,10.020207722981771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,1,power_law_1.2,3.5978111267089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,balanced,0.08202666540940602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,power_law_1.2,0.08602880239486695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,1,power_law_1.2,5.41926383972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,4,power_law_1.01,0.0830847978591919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,balanced,0.08267733454704285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,power_law_1.2,0.09991679787635803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,4,power_law_1.01,0.08689280152320862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,balanced,0.0565226674079895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,1,power_law_1.2,10.33457260131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,balanced,0.06187733511130015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,power_law_1.2,0.11263359785079956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,balanced,0.10301333665847778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,4,power_law_1.01,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,power_law_1.2,0.11123839616775513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,balanced,0.09796266754468282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,balanced,0.0846613347530365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,4,power_law_1.01,0.11139199733734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,power_law_1.2,0.11258879899978638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,balanced,0.09813867012659709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,balanced,0.10098133484522502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,4,power_law_1.01,0.11118079423904419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,power_law_1.2,0.19527679681777954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,balanced,0.0738613357146581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,balanced,0.17864533265431723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,4,power_law_1.01,0.1909183979034424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,power_law_1.2,0.20742399692535402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,balanced,0.0843999981880188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,power_law_1.2,0.20108160972595215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,balanced,0.17915199200312296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,4,power_law_1.01,0.1860159993171692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,balanced,0.08482133348782857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,power_law_1.2,0.20769920349121093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,balanced,0.18052800496419272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,4,power_law_1.01,0.19678720235824584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,balanced,0.08499200145403545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,power_law_1.2,0.22072958946228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,power_law_1.01,0.06305919885635376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,balanced,0.17915733655293783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,4,power_law_1.01,0.21115520000457763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,balanced,0.07900266846021016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,power_law_1.2,0.27217280864715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,balanced,0.18101332585016885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,4,power_law_1.01,0.2149440050125122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,power_law_1.01,0.06647040247917176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,balanced,0.07962666451931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,power_law_1.2,0.3304768085479736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,power_law_1.01,0.08476799726486206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,power_law_1.01,0.24677760601043702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,4,balanced,0.181551992893219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,power_law_1.2,0.3496639966964722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,balanced,0.07966400186220805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,power_law_1.01,0.08358399868011475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,power_law_1.01,0.28397440910339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,4,balanced,0.1855413317680359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,power_law_1.2,0.4460159778594971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,balanced,0.10636799534161885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,balanced,0.1088746686776479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,power_law_1.2,0.6014016151428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,power_law_1.01,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,power_law_1.01,0.3527744054794312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,4,balanced,0.1886613368988037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,balanced,0.10602666934331258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,power_law_1.2,0.9416576385498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,power_law_1.01,0.08302080035209655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,power_law_1.01,0.4210495948791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,4,balanced,0.30187733968098956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,power_law_1.01,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,balanced,0.16942399740219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,power_law_1.2,1.274022388458252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,power_law_1.01,0.5804351806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,4,balanced,0.31037332614262897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,power_law_1.01,0.08375679850578308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,balanced,0.17139200369517008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,power_law_1.2,1.8466432571411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,power_law_1.01,0.7517632007598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,balanced,0.17245332400004068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,power_law_1.01,0.08985599875450134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,power_law_1.2,2.636800003051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,4,balanced,0.46927467981974286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,power_law_1.01,0.8276991844177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,balanced,0.17602133750915527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,power_law_1.01,0.08883200287818908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,power_law_1.2,3.496236801147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,power_law_1.01,1.4491711616516114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,power_law_1.01,0.10029439926147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,balanced,0.1803306738535563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,4,balanced,0.5905013481775919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,power_law_1.01,2.334835243225098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,power_law_1.2,4.981516647338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,power_law_1.01,0.11575679779052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,balanced,0.3207733432451884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,power_law_1.01,3.075187110900879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,power_law_1.01,0.11541119813919068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,power_law_1.2,5.5973247528076175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,4,balanced,0.8720959822336832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,balanced,0.33007999261220294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,power_law_1.01,0.12728320360183715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,power_law_1.01,3.4906368255615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,balanced,0.48153066635131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,power_law_1.01,0.2205440044403076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,power_law_1.2,10.292723083496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,power_law_1.01,0.21834878921508788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,4,balanced,1.1521759827931721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,power_law_1.01,5.188127899169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,balanced,0.6320373217264811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,power_law_1.01,0.2305919885635376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,power_law_1.2,21.245606994628908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,power_law_1.01,8.198770904541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,power_law_1.01,0.26922879219055174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,balanced,0.9309706687927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,power_law_1.01,0.32177278995513914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,4,balanced,1.7010186513264973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,power_law_1.01,14.754208374023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,power_law_1.01,0.4258880138397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,power_law_1.01,0.5120128154754638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,balanced,1.2259039878845215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,power_law_1.01,0.7186944007873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,power_law_1.01,0.8558655738830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,4,balanced,2.262693405151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,balanced,1.8171092669169109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,power_law_1.01,1.2401344299316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,power_law_1.01,1.583993625640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,power_law_1.01,2.3542463302612306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,4,balanced,2.8441492716471353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,balanced,2.4083733558654785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,power_law_1.01,3.3696640014648436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,power_law_1.01,4.011270523071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,power_law_1.01,6.425830078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,balanced,2.9810667037963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,power_law_1.01,12.975564575195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,4,balanced,4.521605491638184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,balanced,4.770240147908528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,4,balanced,8.884757359822592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,2,power_law_1.2,0.06468480229377746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,balanced,0.03254399945338567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,2,power_law_1.2,0.07156479954719544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,power_law_1.01,0.03187200129032135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,2,power_law_1.2,0.08470399975776673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,balanced,0.040949332217375435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,power_law_1.01,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,2,power_law_1.2,0.08193280100822449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,balanced,9.45573361714681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,2,power_law_1.2,0.07232000231742859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,power_law_1.01,0.04665600061416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,balanced,0.05442133545875549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,2,power_law_1.2,0.08258559703826904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,power_law_1.01,0.05847679972648621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,balanced,0.08577600121498108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,2,power_law_1.2,0.08369280099868774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,2,power_law_1.2,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,power_law_1.01,0.07848960161209106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,balanced,0.08081600069999695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,balanced,0.07241599758466084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,power_law_1.01,0.07087360024452209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,2,power_law_1.2,0.09212160110473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,balanced,0.07316799958546956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,power_law_1.01,0.07856000065803528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,2,power_law_1.2,0.09626240134239197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,balanced,0.0796800007422765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,power_law_1.01,0.08054400086402894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,2,power_law_1.2,0.10241919755935669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,balanced,0.07948266466458638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,power_law_1.01,0.07991039752960205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,2,power_law_1.2,0.11603200435638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,balanced,0.08014933268229167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,power_law_1.01,0.0824832022190094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,2,power_law_1.2,0.11518720388412476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,balanced,0.07934933404127757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,power_law_1.01,0.09684479832649232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,2,power_law_1.2,0.1283136010169983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,balanced,0.07830933233102162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,power_law_1.01,0.10154240131378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,2,power_law_1.2,0.2182080030441284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,balanced,0.07878399888674419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,power_law_1.01,0.10179200172424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,2,power_law_1.2,0.21971840858459474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,power_law_1.01,0.1051584005355835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,balanced,0.08014933268229167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,power_law_1.01,0.12332799434661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,2,power_law_1.2,0.2410815954208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,balanced,0.10403199990590413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,power_law_1.01,0.1395967960357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,2,power_law_1.2,0.3048255920410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,power_law_1.01,0.15397119522094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,balanced,0.1065120001633962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,power_law_1.01,0.26306560039520266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,2,power_law_1.2,0.32924799919128417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,balanced,0.10843200484911601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,power_law_1.01,0.2929984092712402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,2,power_law_1.2,0.4329023838043213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,balanced,0.18267200390497842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,power_law_1.01,0.37367680072784426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,power_law_1.01,0.45080318450927737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,2,power_law_1.2,0.47992959022521975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,balanced,0.1887306571006775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,power_law_1.01,0.6043712139129639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,2,power_law_1.2,0.6299967765808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,power_law_1.01,0.7612224102020264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,balanced,0.3391679922739665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,2,power_law_1.2,0.9022527694702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,power_law_1.01,1.0725631713867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,balanced,0.35420799255371094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,2,power_law_1.2,1.3165632247924806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,power_law_1.01,1.3913087844848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,2,power_law_1.2,1.8132352828979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,power_law_1.01,1.9956672668457032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,balanced,0.517034649848938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,balanced,0.15389333168665567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,1,power_law_1.2,0.03274880051612854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,power_law_1.01,2.630156707763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,2,power_law_1.2,2.502169609069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,balanced,0.14612799882888794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,balanced,0.68122665087382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,power_law_1.01,3.23449592590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,2,power_law_1.2,3.5311744689941404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,1,power_law_1.2,0.038553598523139956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,balanced,0.1458399991194407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,1,power_law_1.2,0.04410879909992218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,power_law_1.01,5.085625457763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,2,power_law_1.2,4.452870559692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,balanced,0.14593600233395895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,balanced,0.9940586884816488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,1,power_law_1.2,0.05601279735565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,balanced,0.14577066898345947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,2,power_law_1.2,6.55032958984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,1,power_law_1.2,0.07955200076103211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,power_law_1.01,9.98958740234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,balanced,0.1453333298365275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,1,power_law_1.2,0.07338240146636962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,balanced,1.3042720158894856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,balanced,0.14773866534233093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,1,power_law_1.2,0.07904000282287597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,2,power_law_1.2,14.344166564941407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,balanced,0.14643200238545737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,1,power_law_1.2,0.08067200183868409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,balanced,0.16180266936620077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,1,power_law_1.2,0.08106880187988282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,balanced,0.1572106679280599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,1,power_law_1.2,0.08606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,balanced,1.9188639322916667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,balanced,0.14975466330846152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,1,power_law_1.2,0.09805439710617066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,balanced,0.1525813341140747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,1,power_law_1.2,0.09692800045013428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,balanced,0.1545919974644979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,1,power_law_1.2,0.09964799880981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,balanced,0.16940265893936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,1,power_law_1.2,0.11092480421066284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,balanced,0.16881599028905234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,balanced,2.5308213233947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,balanced,0.10214933753013611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,1,power_law_1.2,0.12363519668579101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,balanced,0.17115734020868936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,balanced,0.09486400087674458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,1,power_law_1.2,0.14269440174102782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,balanced,0.1840426723162333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,balanced,0.09598933657010396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,1,power_law_1.2,0.15449600219726561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,balanced,0.2205866575241089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,balanced,0.09723200400670369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,1,power_law_1.2,0.2659327983856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,balanced,0.22401599089304605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,1,power_law_1.2,0.30352001190185546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,balanced,0.09770133097966512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,balanced,3.150090535481771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,1,power_law_1.2,0.3799360036849976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,balanced,0.0983786682287852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,balanced,0.29386667410532635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,balanced,0.09801600376764934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,1,power_law_1.2,0.44611201286315916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,balanced,0.308186670144399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,balanced,0.10075733065605164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,1,power_law_1.2,0.6044223785400391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,balanced,0.47013334433237713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,balanced,0.10129599769910176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,1,power_law_1.2,0.7603583812713623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,balanced,0.10212266445159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,1,power_law_1.2,1.080396842956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,balanced,0.5358080069224039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,balanced,0.10198400417963664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,1,power_law_1.2,1.3935232162475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,balanced,0.10073600212732951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,1,power_law_1.2,2.0029056549072264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,balanced,0.8090186913808187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,1,power_law_1.2,2.6174144744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,balanced,0.10302933057149251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,1,power_law_1.2,3.2285888671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,balanced,0.10853333274523418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,balanced,0.9321440060933431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,balanced,0.1143893301486969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,balanced,5.007178624471028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,1,power_law_1.2,5.087334442138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,balanced,0.11482133467992146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,balanced,1.3854986826578777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,balanced,0.12112533052762349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,power_law_1.2,9.987213134765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,balanced,0.14680533607800803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,balanced,0.14198399583498636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,balanced,1.8665226300557454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,balanced,0.2112320065498352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,balanced,0.20840533574422201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,balanced,0.3057813247044881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,balanced,2.3547520637512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,balanced,0.3394293387730916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.1428928017616272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,balanced,0.08754666646321614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.15016319751739501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,balanced,0.5286240180333456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,balanced,0.08718400200208028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.146560001373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,balanced,0.0869813362757365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,balanced,0.6559306780497233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,balanced,3.7487786610921225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,balanced,0.09116266171137492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,balanced,0.09083200494448344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.14666880369186402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,balanced,0.09266133109728496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,1,balanced,9.969866434733072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.14598400592803956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,balanced,0.9385759830474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,balanced,0.09451733032862346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.15580159425735474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,balanced,0.09449600179990132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.1649216055870056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,balanced,1.221781333287557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.17430399656295775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,balanced,0.09731733798980713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.23625600337982178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,balanced,0.09714667002360027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.2816319942474365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,balanced,7.612245559692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,balanced,1.5600053469340007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.25131518840789796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.01,0.29091839790344237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.01,0.3338495969772339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,balanced,0.09754133224487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.01,0.27111039161682127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,balanced,2.4043572743733725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,balanced,0.09860799709955852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.01,0.36871678829193116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,balanced,0.10033599535624187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,balanced,0.10101333260536194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.01,0.34948480129241943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.01,0.3648960113525391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.01,0.5994048118591309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.01,0.8370431900024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,balanced,4.884042739868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.01,1.2476672172546386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,balanced,0.11128532886505127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,balanced,0.11356266339619954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.01,0.9742912292480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,balanced,0.11685333649317424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.01,1.3612031936645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.01,1.7363136291503907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,balanced,0.14662399888038635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.01,3.1723968505859377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,balanced,0.15218666195869446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.01,3.8229312896728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.01,5.808422470092774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.09304959774017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,balanced,0.20053333044052124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.01,8.079942321777343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.09468799829483032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.01,10.748332977294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,power_law_1.01,0.08610560297966004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.09667840003967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,power_law_1.01,0.08657919764518737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.09626240134239197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.01,17.02574005126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,power_law_1.01,0.08856319785118102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.10056320428848267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,balanced,0.2550026575724284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.11418880224227905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,power_law_1.01,0.09062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.10490239858627319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,power_law_1.01,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.01,29.271847534179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.11239039897918701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,power_law_1.01,0.10517760515213012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,power_law_1.01,0.11215360164642334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.12744319438934326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,balanced,0.40451733271280926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,power_law_1.01,0.12738560438156127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.12092800140380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,balanced,0.4449546734491984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.13011200428009034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,power_law_1.01,0.11715840101242066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.15181440114974976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,balanced,0.6719840367635092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,power_law_1.01,0.14796160459518432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.13467520475387573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,balanced,0.8784159819285074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.1813055992126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.18619519472122192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,power_law_1.01,0.12403199672698975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,balanced,1.3266613483428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.22406399250030518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,power_law_1.01,0.13793280124664306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.01,0.32794239521026614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,power_law_1.01,0.15909119844436645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,balanced,1.7609866460164387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,0.456876802444458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,power_law_1.01,0.19274879693984986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.1374783992767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,0.7490176200866699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.14124159812927245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,0.5696576118469239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.13968000411987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,power_law_1.01,0.19874559640884398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,balanced,2.1727306048075357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,0.8221183776855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.1403712034225464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,power_law_1.01,0.23507840633392335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.14162559509277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,1.07457275390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.15301120281219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,power_law_1.01,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,1.4333824157714843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.15827200412750245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.1648576021194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,2.017932891845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,power_law_1.01,0.32987520694732664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.23546240329742432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,balanced,3.4897120793660483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,3.004755210876465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,1,8,power_law_1.2,0.2369663953781128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.01,0.5473728179931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.2520576000213623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,4.3724609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,1,8,power_law_1.2,0.3370048046112061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.01,0.716703987121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,1,8,power_law_1.2,0.3390079975128174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.01,5.808755111694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,1,8,power_law_1.2,0.2797631978988647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,1,8,power_law_1.2,0.39492480754852294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.01,9.190335845947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,1,8,power_law_1.2,0.41356801986694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.01,0.9765631675720214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,1,8,power_law_1.2,0.44023680686950684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,1,8,power_law_1.2,0.6958399772644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.01,17.218028259277343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.01,1.4201024055480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,1,8,power_law_1.2,0.8145088195800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,balanced,6.944746653238933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,1,8,power_law_1.2,1.3021439552307128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.0926144003868103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.01,1.610758399963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,1,8,power_law_1.2,0.985747241973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.09448320269584656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.01,2.3091968536376952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,1,8,power_law_1.2,1.4526016235351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,1,8,power_law_1.2,0.08622080087661743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.01,3.092492866516113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,1,8,power_law_1.2,1.9150976181030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.09591040015220642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,1,8,power_law_1.2,3.3141632080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,1,8,power_law_1.2,0.08655359745025634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.01,4.916032028198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.09619200229644775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,1,8,power_law_1.2,0.0877120018005371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,1,8,power_law_1.2,4.058451080322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.10247039794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.01,6.595532989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,1,8,power_law_1.2,0.09063040018081665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,1,8,power_law_1.2,6.3445697784423825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.11468160152435303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,1,8,power_law_1.2,0.09226239919662475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,power_law_1.01,7.724332427978515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.10696959495544434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,1,8,power_law_1.2,8.114431762695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,1,8,power_law_1.2,0.10348800420761109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.12392319440841675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,power_law_1.01,12.843923950195313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,1,8,power_law_1.2,0.1181439995765686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,1,8,power_law_1.2,10.89249267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.1217919945716858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,1,8,power_law_1.2,0.12340480089187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.1219648003578186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.1460927963256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,1,8,power_law_1.2,16.25125732421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,power_law_1.01,26.557638549804686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,1,8,power_law_1.2,0.13661439418792726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.144051194190979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,balanced,0.09310932954152425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.1338752031326294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,1,8,power_law_1.2,0.14424320459365844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.1810431957244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,balanced,0.08435733119646709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,1,8,power_law_1.2,31.05465087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.17244800329208373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,balanced,0.13915200034777322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,1,8,power_law_1.2,0.12334719896316529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.2236032009124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,balanced,0.1442506710688273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,1,8,power_law_1.2,0.13852800130844117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,1,8,power_law_1.2,0.2956415891647339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,balanced,0.14100799957911173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,1,8,power_law_1.2,0.15589760541915892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,0.5010623931884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,balanced,0.14173866311709085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,1,8,power_law_1.2,0.18508800268173217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,0.6685632228851318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,balanced,0.14113600055376688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,0.5935488224029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,balanced,0.1421280006567637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,1,8,power_law_1.2,0.18769279718399048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,0.8709247589111329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,balanced,0.14669866363207498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,1,8,power_law_1.2,0.23057920932769777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,1.0189632415771483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,balanced,0.14634133378664652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,1,8,power_law_1.2,0.29816958904266355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,1.5463295936584474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,balanced,0.14813333749771118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,1,8,power_law_1.2,0.38800640106201173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,balanced,0.15200000007947287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,2.051219177246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.2,0.5063680171966553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,balanced,0.1525973379611969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,2.9628095626831055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,balanced,0.16082666317621866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.2,0.7901631832122803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,4.692505645751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,balanced,0.17173333962758383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,1,8,power_law_1.2,5.906393432617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,balanced,0.1750133236249288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.2,0.9443136215209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,1,8,power_law_1.2,9.54369888305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,balanced,0.1846826672554016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.2,1.597267246246338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,balanced,0.06730133295059204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,balanced,0.19325333833694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,1,8,power_law_1.2,17.081529235839845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.2,1.6256256103515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,balanced,0.0621973325808843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,balanced,0.21422400077184042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.2,2.534547233581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,balanced,0.09075199564297994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,balanced,0.31596267223358154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.2,2.981088066101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,balanced,0.09325333436330159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,balanced,0.31380265951156616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,balanced,0.09408000111579895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.2,5.026156616210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,balanced,0.4485386610031128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,balanced,0.0956160028775533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.2,6.559264373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,balanced,0.09602133433024089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,balanced,0.5461973349253336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,balanced,0.09590933720270793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,1,8,power_law_1.2,8.460787200927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,balanced,0.797322670618693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,balanced,0.09684266646703084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,1,8,power_law_1.2,13.132339477539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,balanced,0.09696533282597859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,balanced,0.9851733048756918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,balanced,0.0981173316637675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,balanced,0.09966933727264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,1,8,power_law_1.2,27.288568115234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,balanced,0.10129066308339436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,balanced,1.4602932929992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,balanced,0.10709333419799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,balanced,0.11315733194351196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,balanced,1.884160041809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,balanced,0.11291199922561646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,balanced,0.11751466989517212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,balanced,0.1335093379020691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,balanced,2.343946615854899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,balanced,0.1492693324883779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,balanced,0.21128533283869425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,balanced,0.21682665745417276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.01,0.12762240171432496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,balanced,0.30369067192077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,balanced,4.185200055440267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.01,0.11593600511550903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,balanced,0.350602666536967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.01,0.11667200326919555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.01,0.14152319431304933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,balanced,0.5102773507436117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.01,0.14054399728775024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.01,0.14201600551605226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,balanced,0.6700479984283447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.01,0.1476863980293274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.01,0.15028480291366578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,balanced,0.056602666775385536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.01,0.1514431953430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,balanced,0.9691627025604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,balanced,8.120469411214193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.01,0.1793984055519104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,balanced,0.05563200016816457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.01,0.17638399600982665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,balanced,0.08335466186205547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.01,0.1902143955230713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.01,0.20500481128692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,balanced,0.08706667025883992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,balanced,1.2780799865722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.01,0.20246400833129882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,balanced,0.08683733145395915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.01,0.24492158889770507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,balanced,0.0883893370628357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.01,0.22906239032745362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.01,0.2751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,balanced,0.08998933434486389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,balanced,1.5807573000590007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.01,0.08021759986877441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.01,0.359116792678833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,balanced,0.08968533078829448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.01,0.4620800018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.01,0.07886080145835876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.01,0.47927680015563967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.01,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.01,0.6631167888641357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,power_law_1.01,0.06575999855995178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,balanced,0.09318932890892029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.01,1.1071999549865723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.01,0.0929472029209137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,power_law_1.01,0.07692800164222717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,balanced,2.624490737915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.01,1.2676671981811523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,balanced,0.0943946639696757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.01,0.0926912009716034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,power_law_1.01,0.08293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.01,2.0595136642456056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.01,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,power_law_1.01,0.0866815984249115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.01,2.7400768280029295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.01,0.09757440090179444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,power_law_1.01,0.08726400136947632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.01,0.0987712025642395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,power_law_1.01,0.09118720293045043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.01,3.8673343658447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.01,0.10190720558166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,power_law_1.01,0.09860479831695557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.01,0.10190080404281616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,power_law_1.01,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.01,5.3594623565673825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.01,0.10172159671783447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,balanced,0.09435199697812398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.01,7.616230773925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,power_law_1.01,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.01,0.1140671968460083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,balanced,0.09669867157936096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.01,0.11697280406951904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,power_law_1.01,0.12064000368118286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,balanced,5.4367415110270185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.01,8.835008239746093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,balanced,0.09796800216039021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.01,0.1368191957473755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,balanced,0.09987200299898784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.01,0.14487040042877197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,power_law_1.01,0.10854400396347046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.01,24.880044555664064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.01,0.18188799619674684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,power_law_1.01,0.11570559740066529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,power_law_1.01,0.1311360001564026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.01,0.19865599870681763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,power_law_1.01,0.15073280334472655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.01,0.2688960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.01,0.26851840019226075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,balanced,0.10920533537864685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,power_law_1.01,0.13809280395507811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.01,0.3407104015350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,balanced,0.11214400331179301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,power_law_1.01,0.15008000135421753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.01,0.4333631992340088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,balanced,0.11681066950162251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,4,power_law_1.2,0.1279360055923462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,power_law_1.01,0.2111680030822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.01,0.5825600147247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,balanced,0.1437493364016215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,power_law_1.01,0.2629184007644653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,4,power_law_1.2,0.11612800359725953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.01,0.6818751811981201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,power_law_1.01,0.3494976043701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,balanced,0.15235199530919394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.01,1.2567551612854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,4,power_law_1.2,0.12819199562072753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.01,1.6620031356811524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,4,power_law_1.2,0.14101120233535766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.01,2.5484479904174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,4,power_law_1.2,0.13852159976959227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,power_law_1.01,0.4649472236633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,balanced,0.20992533365885416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,4,power_law_1.2,0.1424512028694153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,power_law_1.01,0.7711103916168213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.01,2.886931228637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,4,power_law_1.2,0.15139199495315553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,balanced,0.2698613405227661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,4,power_law_1.2,0.150764799118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.01,4.858988952636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,4,power_law_1.2,0.1702847957611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.01,6.093235015869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,4,power_law_1.2,0.1763200044631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,power_law_1.01,1.0734592437744142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,balanced,0.41262932618459064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,4,power_law_1.2,0.1756991982460022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,power_law_1.01,1.3454336166381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,balanced,0.5472533305486044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,power_law_1.01,1.9676544189453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.01,14.536070251464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,4,power_law_1.2,0.1938688039779663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,power_law_1.01,3.0808319091796874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,4,power_law_1.2,0.2350719928741455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,balanced,0.8386240005493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,power_law_1.01,3.785939025878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,4,power_law_1.2,0.20742399692535402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,4,power_law_1.2,0.08443520069122315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,power_law_1.01,6.770169830322265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,4,power_law_1.2,0.2574016094207764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,4,power_law_1.2,0.07856640219688416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,balanced,1.1153066953023274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,4,power_law_1.2,0.08504319787025452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,4,power_law_1.2,0.28067200183868407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,power_law_1.01,7.040531158447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,4,power_law_1.2,0.09318400025367737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,4,power_law_1.2,0.2898240089416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,4,power_law_1.2,0.09276800155639649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,balanced,1.6494933764139812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,4,power_law_1.2,0.0953984022140503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,power_law_1.01,14.933477783203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,4,power_law_1.2,0.39530880451202394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,4,power_law_1.2,0.09802240133285522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,4,power_law_1.2,0.09790080189704894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,4,power_law_1.2,0.5052095890045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,4,power_law_1.2,0.10398720502853394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,balanced,2.195045312245687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,power_law_1.01,24.447410583496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,4,power_law_1.2,0.10595840215682983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,4,power_law_1.2,0.6932928085327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,4,power_law_1.2,0.10083199739456176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,4,power_law_1.2,0.6591743946075439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,4,power_law_1.2,0.1128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,4,power_law_1.2,0.9792575836181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,4,power_law_1.2,0.12012159824371338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,balanced,2.7403361002604165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,4,power_law_1.2,0.13701119422912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,4,power_law_1.2,1.4011455535888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,4,power_law_1.2,0.1598207950592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,4,power_law_1.2,2.3327232360839845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,4,power_law_1.2,0.1673087954521179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,4,power_law_1.2,0.17121920585632325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,4,power_law_1.2,2.5645503997802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,4,power_law_1.2,0.26545279026031493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,balanced,4.414005279541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,4,power_law_1.2,0.30788478851318357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,4,power_law_1.2,4.1015361785888675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,4,power_law_1.2,0.4128255844116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,4,power_law_1.2,0.5020544052124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,4,power_law_1.2,4.8543743133544925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,4,power_law_1.2,0.7208384037017822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,4,power_law_1.2,0.07162240147590637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,4,power_law_1.2,0.8871871948242187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,4,power_law_1.2,7.672249603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,4,power_law_1.2,0.07698559761047363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,4,power_law_1.2,1.1239295959472657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,4,power_law_1.2,1.6628864288330079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,4,power_law_1.2,0.08327680230140685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,4,power_law_1.2,12.633126068115235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,4,power_law_1.2,2.1387264251708986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,4,power_law_1.2,0.08613119721412658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,4,power_law_1.2,3.912211227416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,balanced,8.80734380086263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,4,power_law_1.2,0.08692479729652405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,4,power_law_1.2,17.481491088867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,4,power_law_1.2,4.073555374145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,4,power_law_1.2,0.09470080137252808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,4,power_law_1.2,6.596781158447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,4,power_law_1.2,0.09937919974327088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,4,power_law_1.2,0.11932799816131592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,4,power_law_1.2,15.222700500488282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,4,power_law_1.2,0.12325760126113891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,4,power_law_1.2,0.11536639928817749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,4,power_law_1.2,0.10856959819793702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,4,power_law_1.2,0.11628799438476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,4,power_law_1.2,0.12684799432754518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,4,power_law_1.2,0.152019202709198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,balanced,0.04781333108743032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,balanced,0.060309335589408875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,4,power_law_1.2,0.1539072036743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,balanced,0.05964266757170359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,balanced,0.08326399823029836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,4,power_law_1.2,0.15186560153961182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,balanced,0.08689066767692566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,balanced,0.137061337629954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,4,power_law_1.2,0.2224639892578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,balanced,0.09057600299517314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,4,power_law_1.2,0.25068159103393556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,balanced,0.1399893363316854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,balanced,0.09112000465393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,4,power_law_1.2,0.3580991983413696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,balanced,0.14114133516947427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,balanced,0.09166399637858073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,balanced,0.14168000221252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,balanced,0.0927946666876475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,4,power_law_1.2,0.6069375991821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,balanced,0.14265599846839905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,balanced,0.0932373305161794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,4,power_law_1.2,0.713209581375122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,balanced,0.14284267028172812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,balanced,0.09471467137336731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,balanced,0.14652799566586813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,4,power_law_1.2,1.0893568038940429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,balanced,0.09577600161234538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,balanced,0.14681599537531534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,4,power_law_1.2,1.5154815673828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,balanced,0.1493226687113444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,balanced,0.09671466549237569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,balanced,0.1542080044746399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,balanced,0.09779199957847595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,4,power_law_1.2,2.1428991317749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,balanced,0.1566933294137319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,balanced,0.09842133522033691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,4,power_law_1.2,2.633171272277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,balanced,0.10451733072598775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,balanced,0.16568533579508463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,balanced,0.112335999806722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,balanced,0.1689173380533854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,4,power_law_1.2,4.584492874145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,balanced,0.17063466707865396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,balanced,0.11353600025177002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,4,power_law_1.2,7.219526672363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,balanced,0.18609599272410074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,balanced,0.12227200468381245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,balanced,0.19476799170176187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,balanced,0.13595199584960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,4,power_law_1.2,7.860966491699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,balanced,0.2166666587193807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,balanced,0.1514400045077006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,balanced,0.2903520067532857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,4,power_law_1.2,12.366893005371093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,balanced,0.19930134216944376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,balanced,0.3202986717224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,balanced,0.23122666279474893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,balanced,0.4463733434677124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,balanced,0.3181493282318115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,4,power_law_1.2,23.521670532226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,balanced,0.5334986845652262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,balanced,0.39559467633565265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,balanced,0.7974720001220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,balanced,0.569973349571228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.01,0.07025279998779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,balanced,0.04139200101296107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,balanced,1.0159467061360676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,balanced,0.7307306925455729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.01,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,balanced,0.05336533486843109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.01,0.09679359793663025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,balanced,0.08147199948628743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,balanced,1.5121760368347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.01,0.1398848056793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,balanced,1.0586506525675456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,balanced,0.0848586658636729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.01,0.14226560592651366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,balanced,0.08578667044639587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.01,0.14513280391693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,balanced,2.0728160540262857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.01,0.15635839700698853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,balanced,1.394192059834798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,balanced,0.0869813362757365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.01,0.15447039604187013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,balanced,0.08878399928410848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.01,0.15800319910049437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,balanced,0.08877866466840108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,balanced,2.503760019938151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.01,0.1625856041908264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,balanced,1.6888906160990398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.01,0.17424639463424682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.01,0.18429440259933472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.01,0.20007040500640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.01,0.19986560344696044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,balanced,0.09020800391832988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,balanced,3.9523305892944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,balanced,2.6363040606180825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.01,0.21298561096191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,balanced,0.09102400143941243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.01,0.20719358921051026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.01,0.23082239627838136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.01,0.28354558944702146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.01,0.33588480949401855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,2,power_law_1.2,0.07641599774360656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.01,0.43546237945556643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.01,0.06116480231285095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,2,power_law_1.2,0.07642239928245545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.01,0.5096960067749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.01,0.06423680186271667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,2,power_law_1.2,0.09750400185585022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,balanced,7.79033088684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.01,0.6316351890563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,balanced,5.553754806518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,2,power_law_1.2,0.13345279693603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,balanced,0.09528000156084697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,power_law_1.01,0.05292159914970398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.01,0.0896127998828888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.01,0.8802240371704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,balanced,0.09658132990201314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,2,power_law_1.2,0.12884479761123657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,power_law_1.01,0.053465598821640016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.01,0.08982399702072144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,balanced,0.0995786686738332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.01,1.4557120323181152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,2,power_law_1.2,0.1468224048614502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,power_law_1.01,0.06234239935874939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,balanced,0.10221866766611735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.01,0.09321600198745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,2,power_law_1.2,0.1574720025062561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.01,1.5958335876464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,power_law_1.01,0.08489599823951721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.01,0.09413759708404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,2,power_law_1.2,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.01,2.5039743423461913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,power_law_1.01,0.08624640107154846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,2,power_law_1.2,0.15294719934463502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.01,3.5714431762695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.01,0.09651839733123779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,power_law_1.01,0.09146239757537841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,2,power_law_1.2,0.1646783947944641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,balanced,0.11302933096885681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.01,0.09896320104598999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.01,4.5317951202392575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,power_law_1.01,0.09408000111579895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,2,power_law_1.2,0.18321919441223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,balanced,0.11618133385976155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.01,0.09968000054359435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.01,6.145651245117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,power_law_1.01,0.09865599870681763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,balanced,0.12370666861534119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,2,power_law_1.2,0.18165119886398315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.01,0.10115840435028076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,balanced,0.15571733315785727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,2,power_law_1.2,0.18798719644546508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,balanced,0.1683573325475057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.01,0.10538239479064941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.01,14.292338562011718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,balanced,0.23259733120600382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,2,power_law_1.2,0.2096384048461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,power_law_1.01,0.1009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.01,0.1053056001663208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,balanced,0.2988640069961548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,2,power_law_1.2,0.20691840648651122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,power_law_1.01,0.10069119930267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.01,0.12484480142593384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,2,power_law_1.2,0.20877439975738527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.01,0.13834880590438842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.01,0.1329792022705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,2,power_law_1.2,0.2247551918029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,power_law_1.01,0.10216959714889526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.01,0.1526528000831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,2,power_law_1.2,0.29393279552459717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,balanced,0.48253333568573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,power_law_1.01,0.10776959657669068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.01,0.1952831983566284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,2,power_law_1.2,0.3184448003768921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,balanced,0.6366666555404663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,power_law_1.01,0.11103999614715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.01,0.2021951913833618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,2,power_law_1.2,0.4171135902404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,power_law_1.01,0.12155519723892212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.01,0.28285439014434816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,balanced,0.9481440385182699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,2,power_law_1.2,0.4364927768707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.01,0.3392640113830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,2,power_law_1.2,0.6606143951416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,balanced,1.2507839997609456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,power_law_1.01,0.13341439962387086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.01,0.4278272151947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,2,power_law_1.2,0.9438207626342774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,power_law_1.01,0.14440319538116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.01,0.6525055885314941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,2,power_law_1.2,1.3815360069274902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,power_law_1.01,0.1691007971763611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,balanced,1.866048018137614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.01,0.7982719898223877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,2,power_law_1.2,2.0024959564208986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,power_law_1.01,0.21237120628356934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.01,1.0038528442382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,2,power_law_1.2,2.893990325927734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,power_law_1.01,0.24839680194854735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.01,1.3926783561706544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,balanced,2.465365409851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,2,power_law_1.2,3.628851318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,power_law_1.01,0.35513598918914796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.01,1.930303955078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,power_law_1.01,0.5105152130126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,2,power_law_1.2,4.600172805786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.01,2.0817216873168944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,balanced,3.0869760513305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,2,power_law_1.2,5.71899528503418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,power_law_1.01,0.7643775939941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.01,4.016563034057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,power_law_1.01,0.891436767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,2,power_law_1.2,14.798483276367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,2,power_law_1.2,0.054425597190856934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.01,8.642515563964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,power_law_1.01,1.3767423629760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,2,power_law_1.2,0.059084802865982056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,balanced,4.934218724568685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,power_law_1.01,1.7607488632202148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,2,power_law_1.2,0.06716799736022949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,power_law_1.01,2.893343925476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,2,power_law_1.2,0.0927295982837677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,power_law_1.01,3.784588623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,2,power_law_1.2,0.09020159840583801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,2,power_law_1.2,0.09340800046920776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,power_law_1.01,5.222387313842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,2,power_law_1.2,0.09509119987487794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,power_law_1.01,6.589151763916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,2,power_law_1.2,0.0991424024105072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,2,power_law_1.2,0.0984063982963562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,balanced,9.970613479614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,power_law_1.01,14.673049926757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,2,power_law_1.2,0.09968640208244324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,2,power_law_1.2,0.10264960527420045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,2,power_law_1.2,0.10316159725189208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,2,power_law_1.2,0.1078976035118103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,2,power_law_1.2,0.13194880485534669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,2,power_law_1.2,0.13486720323562623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,2,power_law_1.2,0.13819520473480223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,2,power_law_1.2,0.16306560039520263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,2,power_law_1.2,0.20242559909820557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,2,power_law_1.2,0.20442240238189696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,2,power_law_1.2,0.2937727928161621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,2,power_law_1.2,0.32371199131011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,2,power_law_1.2,0.4829440116882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,2,power_law_1.2,0.5586175918579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,2,power_law_1.2,0.8258815765380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,2,power_law_1.2,1.1040384292602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,2,power_law_1.2,1.7114559173583985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,2,power_law_1.2,2.130092811584473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,2,power_law_1.2,2.602822494506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,balanced,0.05866133173306783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,balanced,0.08213333288828532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,2,power_law_1.2,4.154975891113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,balanced,0.13637866576512656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,balanced,0.1409119963645935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,2,power_law_1.2,10.247705841064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,2,power_law_1.2,0.04748159945011139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,balanced,0.14135467012723288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,balanced,0.14168000221252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,2,power_law_1.2,0.06232960224151611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,balanced,0.1432213286558787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,2,power_law_1.2,0.05935360193252563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,balanced,0.1439466675122579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,2,power_law_1.2,0.08214399814605713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,balanced,0.14800533652305603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,balanced,0.1488693356513977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,2,power_law_1.2,0.08594560027122497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,balanced,0.04065066576004028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,balanced,0.15270400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,balanced,0.1551040013631185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,2,power_law_1.2,0.09525120258331299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,balanced,0.15588800112406412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,balanced,0.05875733494758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,balanced,0.16478932897249857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,2,power_law_1.2,0.09418240189552307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,balanced,0.08700266480445862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,balanced,0.17342400550842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,2,power_law_1.2,0.09576320052146911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,balanced,0.17460266749064127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,balanced,0.0911253293355306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,balanced,0.1898720065752665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,balanced,0.09081600109736125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,balanced,0.21010667085647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,2,power_law_1.2,0.09767680168151856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,balanced,0.22547733783721924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,balanced,0.09185066819190979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,balanced,0.28777599334716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,2,power_law_1.2,0.10494719743728638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,balanced,0.0944053332010905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,balanced,0.34808532396952313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,balanced,0.09457600116729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,balanced,0.49322664737701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,balanced,0.09492799639701843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,2,power_law_1.2,0.10502400398254394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,balanced,0.09590400258700053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,balanced,0.6057066520055135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,2,power_law_1.2,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,balanced,0.09807466467221577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,2,power_law_1.2,0.11062400341033936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,balanced,0.9048746426900228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,balanced,0.09987200299898784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,2,power_law_1.2,0.13007359504699706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,balanced,0.1020906666914622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,balanced,1.1320746739705403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,balanced,0.10972799857457478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,2,power_law_1.2,0.13348480463027954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,balanced,0.11834133664766948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,2,power_law_1.2,0.14279040098190307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,balanced,0.11914666493733723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,balanced,1.6946454048156738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,2,power_law_1.2,0.1523200035095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,balanced,0.12436266740163167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,2,power_law_1.2,0.20159358978271485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,2,power_law_1.2,0.30380160808563234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,balanced,0.1586186687151591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,2,power_law_1.2,0.3819648027420044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,balanced,2.295541286468506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,balanced,0.16706132888793945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,2,power_law_1.2,0.4765183925628662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,balanced,0.21993066867192587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,2,power_law_1.2,0.9567487716674805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.0582144021987915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,balanced,0.2630186676979065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,balanced,2.8516480127970376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.06785280108451844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,2,power_law_1.2,1.013811206817627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,balanced,0.36716266473134357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.08558719754219055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,2,power_law_1.2,1.3796992301940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,balanced,0.4422080119450887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.1398975968360901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,2,power_law_1.2,2.090284729003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,balanced,0.6397013266881307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.13979519605636598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,2,power_law_1.2,3.089740753173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.1435520052909851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,balanced,4.378986676534017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,balanced,0.8322986761728922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.14655359983444213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,2,power_law_1.2,4.5515392303466795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.14707839488983154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,balanced,0.03982399900754293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.14923520088195802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,2,power_law_1.2,4.940876770019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.051583999395370485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,balanced,1.2507893244425456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.15089919567108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,balanced,0.053802669048309326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.16008960008621215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.061324799060821535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,balanced,0.08140266438325246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,2,power_law_1.2,7.5067901611328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.16402560472488403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,balanced,0.08559466401735942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.08850560188293458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.16551040410995482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,balanced,1.6580106417338054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,balanced,0.08592533071835835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.1962815999984741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,power_law_1.01,0.038822400569915774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.09010559916496277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,2,power_law_1.2,17.178009033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.20611200332641602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,balanced,0.08864532907803853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,power_law_1.01,0.04642559885978699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.09259520173072815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.20519039630889893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,balanced,0.08962666988372803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,balanced,8.609882354736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.23519361019134521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,balanced,0.09012266993522644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,balanced,2.0452906290690103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.09271680116653443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,power_law_1.01,0.05118079781532288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.2532416105270386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,power_law_1.01,0.0791808009147644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.0950655996799469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.2728895902633667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,power_law_1.01,0.08484479784965515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.09629439711570739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.33177599906921384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,power_law_1.01,0.08892800211906433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.0964031994342804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.38779520988464355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,power_law_1.01,0.09276800155639649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,balanced,3.376672108968099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,balanced,0.09257066249847412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.528985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.09832320213317872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,power_law_1.01,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.6749120235443116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,balanced,0.09482133388519287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.01,0.10241919755935669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.01,0.9259200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.10547840595245361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,power_law_1.01,0.0967296004295349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.01,1.2201536178588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.12378879785537719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,power_law_1.01,0.0995519995689392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.13346560001373292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.01,1.823756790161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.137990403175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.01,2.4012735366821287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.1401471972465515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.16855039596557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.01,3.0458047866821287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,balanced,6.239498774210612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.18611199855804444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.01,4.352979278564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.240447998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.01,8.58782730102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.0574400007724762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.2712064027786255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,balanced,0.0985599954922994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,power_law_1.01,0.10693119764328003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,0.37633280754089354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,balanced,0.10157333811124165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,power_law_1.01,0.107750403881073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,0.468339204788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.08057600259780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,balanced,0.10549867153167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,balanced,0.11034133036931355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,0.6619711875915527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.13394559621810914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,power_law_1.01,0.1091647982597351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,0.8459136009216308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.13477760553359985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,power_law_1.01,0.11981439590454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,1.2261311531066894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.14369280338287355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.14652160406112671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,1.6767168045043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,balanced,0.1237546702226003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,power_law_1.01,0.13393280506134034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.1480191946029663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.01,2.080793571472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,balanced,0.12895466883977255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.1498751997947693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,power_law_1.01,0.13515520095825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.01,3.295897674560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,balanced,0.13802666465441385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.1562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,power_law_1.01,0.15718400478363037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.01,6.109164810180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,balanced,0.18205867211023966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.15819519758224487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,power_law_1.01,0.19972480535507203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,balanced,0.2011680006980896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.16513279676437378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.01,0.23802878856658935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.16805119514465333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.01,0.3307199954986572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,balanced,0.2946453293164571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.1997056007385254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.01,0.41784958839416503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,balanced,0.38713598251342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.21171839237213136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.21086080074310304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.2364032030105591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.01,0.6154816150665283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.2522880077362061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,balanced,0.5924373467763265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.01,0.8111359596252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.2721791982650757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.01,1.1687487602233886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.3430272102355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,balanced,0.7735839684804281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.01,1.5423040390014648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.3925503969192505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,balanced,1.1497866312662761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.5383808135986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.01,2.265939140319824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.673689603805542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,balanced,1.5216800371805828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.01,2.995795249938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,1,power_law_1.2,0.9162495613098145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.01,3.7480064392089845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,1,power_law_1.2,1.1887871742248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,balanced,2.2492213249206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,power_law_1.01,5.939212799072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,1,power_law_1.2,1.8489280700683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,1,power_law_1.2,2.440339279174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,power_law_1.01,11.893721771240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,balanced,2.9838507970174155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,1,power_law_1.2,3.0333440780639647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,1,power_law_1.2,4.331103897094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,balanced,3.7347892125447593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,1,power_law_1.2,8.549152374267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,balanced,5.925301233927409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.04349440038204193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.053907197713851926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,balanced,11.993211110432943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.05751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.08762239813804626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.08891519904136658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.09214720129966736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,1,power_law_1.2,0.03746559917926788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.09352959990501404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,1,power_law_1.2,0.047353601455688475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.09544320106506347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.09613440036773682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,1,power_law_1.2,0.04912639856338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.09616000056266785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,1,power_law_1.2,0.08044800162315369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,balanced,0.14990400274594626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.10060800313949585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,balanced,0.254746675491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,1,power_law_1.2,0.08367999792098998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.10314240455627441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,balanced,0.1325226624806722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,balanced,0.22357332706451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,1,power_law_1.2,0.0868607997894287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.10446079969406127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,balanced,0.13275733590126038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,1,power_law_1.2,0.09347839951515198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,balanced,0.22266133626302084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.12684799432754518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,balanced,0.13634133338928223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,1,power_law_1.2,0.09589759707450866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,balanced,0.22240533431371054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.13784960508346558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,balanced,0.1363040010134379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,balanced,0.2220426599184672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.13905279636383056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,balanced,0.13809067010879517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,balanced,0.222378671169281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.14191360473632814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,balanced,0.13874133427937826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,1,power_law_1.2,0.09804159998893738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,balanced,0.14125866691271463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,balanced,0.222053329149882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.1651136040687561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,1,power_law_1.2,0.1014847993850708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,balanced,0.14065600434939066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.18762880563735962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,balanced,0.22604799270629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,balanced,0.14173866311709085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.2396159887313843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,balanced,0.23301867643992105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,1,power_law_1.2,0.10613759756088256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,balanced,0.1450506647427877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.2716928005218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,balanced,0.23442665735880533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,balanced,0.14384532968203226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.37484159469604494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,balanced,0.24211200078328451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,1,power_law_1.2,0.10625920295715333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,balanced,0.14615999658902487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,0.47531518936157224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,balanced,0.23592533667882284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,1,power_law_1.2,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,balanced,0.14958932995796204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,0.670630407333374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,balanced,0.2393653392791748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,1,power_law_1.2,0.12394239902496337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,balanced,0.1731520096460978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,0.8546303749084473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,balanced,0.24005866050720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,balanced,0.17645333210627237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,1.2480575561523437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,balanced,0.28853867451349896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,1,power_law_1.2,0.13462400436401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,balanced,0.17335466543833414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,balanced,0.2924373348553975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,1.659609603881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,1,power_law_1.2,0.13636480569839476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,balanced,0.20652266343434653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,balanced,0.27754666407903034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,1,power_law_1.2,2.081990432739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,1,power_law_1.2,0.1590783953666687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,balanced,0.19458667437235513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,balanced,0.3499946594238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,1,power_law_1.2,0.20760319232940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,1,power_law_1.2,3.315795135498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,balanced,0.2954079906145732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,balanced,0.29561599095662433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.2,0.23982079029083253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,1,power_law_1.2,6.130054473876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,balanced,0.29978134234746295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,balanced,0.4638400077819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.2,0.3319808006286621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,balanced,0.4599573214848836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,balanced,0.4569013516108195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.2,0.42225918769836424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,balanced,0.5761653184890747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,balanced,0.739413340886434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.2,0.6176064014434814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,balanced,0.9467679659525553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,balanced,0.8382559617360433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.2,0.8063039779663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.2,1.1771072387695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,balanced,1.4622613588968914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,balanced,0.9677600065867106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.2,1.5368255615234374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.2,2.2772159576416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,balanced,1.8754453659057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,balanced,0.14621866742769876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,balanced,1.4784746170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.2,3.0071104049682615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,balanced,0.1272586683432261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,balanced,2.854175885518392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.2,3.7329792022705077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,balanced,0.12984533111254373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,balanced,1.9617759386698406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,balanced,0.1316266655921936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,1,power_law_1.2,5.9775230407714846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,balanced,0.13190933068593344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,balanced,0.13274133205413818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,balanced,3.7225653330485025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,balanced,0.13487999637921652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,1,power_law_1.2,11.85239028930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,balanced,2.4937386512756348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,balanced,0.1348426640033722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.24270079135894776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.1490880012512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,balanced,4.722938537597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,balanced,0.14245333274205527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.2187903881072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.1322111964225769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,balanced,3.924549420674642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.21813759803771973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,balanced,0.1437493364016215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.21946239471435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.13192960023880004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.21984639167785644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.13486720323562623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.2380671977996826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,balanced,7.46671994527181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.1363584041595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.01,0.27056639194488524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.01,0.2460479974746704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.14869120121002197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.01,0.26211841106414796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.01,0.2891200065612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.16695040464401245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,balanced,0.14219733079274496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.01,0.39276158809661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.01,0.4772031784057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.14919040203094483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,balanced,0.14363200465838113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.01,0.49672961235046387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,balanced,7.7559254964192705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.16432640552520753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.01,0.4852799892425537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,balanced,0.14613866806030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.1766144037246704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.01,0.543455982208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,balanced,0.1471466620763143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.1583680033683777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.01,0.6707136154174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.01,0.19098880290985107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.01,0.4821887969970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,balanced,15.426085154215494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.01,0.170796799659729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.01,0.732147216796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.01,0.8054080009460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.2546112060546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.01,1.2370559692382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.01,0.3615679979324341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,power_law_1.01,0.13878400325775148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,balanced,0.15940266847610474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.01,1.329798412322998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.01,0.3300159931182861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,power_law_1.01,0.12730239629745482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.01,1.9703359603881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,balanced,0.16207999984423319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.01,0.31811840534210206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,power_law_1.01,0.12752000093460084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.01,3.1987199783325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,balanced,0.16553599635759988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.01,0.45462398529052733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,power_law_1.01,0.1309056043624878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.01,5.21655044555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,0.43880319595336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,power_law_1.01,0.1316864013671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.01,6.888697814941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,power_law_1.01,0.15538560152053832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,0.6293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,balanced,0.2071946660677592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,0.8499775886535644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,power_law_1.01,0.17929600477218627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.01,14.946304321289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,balanced,0.217466672261556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,1.2552255630493163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,power_law_1.01,0.1832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.01,14.317893981933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,1.6808895111083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,power_law_1.01,0.20393600463867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,2.6075136184692385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.01,14.360243225097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,power_law_1.01,0.20341119766235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,balanced,0.3225119908650716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,3.468288040161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,5.587615966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.01,27.991802978515626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,balanced,0.4097919861475627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,power_law_1.01,0.17727359533309936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,balanced,0.6169813474019369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,6.7225341796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,power_law_1.01,0.23170559406280516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,power_law_1.01,0.22093439102172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.01,8.261427307128907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,balanced,0.6612853209177653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,power_law_1.01,0.298854398727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.01,58.72930908203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.01,13.694117736816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,power_law_1.01,0.3148672103881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,power_law_1.01,0.2999808073043823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,balanced,1.0734079678853352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.01,27.8715576171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,power_law_1.01,0.42143998146057127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,balanced,1.3251307010650635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,power_law_1.01,0.48534398078918456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.01,0.7854656219482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,balanced,1.9823466936747234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.01,1.1713855743408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.24065918922424318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.01,1.5257344245910645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.2183295965194702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,balanced,2.6122719446818032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.21767680644989013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.01,2.3870847702026365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.2194432020187378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.22018558979034425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.01,2.326246452331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.2344831943511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,balanced,3.2522185643514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,1,8,power_law_1.2,0.26961920261383054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,1,8,power_law_1.2,0.24952321052551268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.01,4.224550247192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,1,8,power_law_1.2,0.27239038944244387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,1,8,power_law_1.2,0.2963648080825806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.01,4.485657501220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,1,8,power_law_1.2,0.36033918857574465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,1,8,power_law_1.2,0.48974080085754396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.01,7.631961822509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,balanced,5.271317481994629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,1,8,power_law_1.2,0.5647232055664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,1,8,power_law_1.2,0.4645376205444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.01,10.107520294189452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,1,8,power_law_1.2,0.5193344116210937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,1,8,power_law_1.2,0.6979904174804688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,1,8,power_law_1.2,0.526585578918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,power_law_1.01,12.44571533203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,1,8,power_law_1.2,0.7308735847473145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,1,8,power_law_1.2,0.8341376304626464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,power_law_1.01,19.749177551269533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,1,8,power_law_1.2,1.0646016120910644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,1,8,power_law_1.2,1.3745408058166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,1,8,power_law_1.2,2.1071359634399416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,balanced,10.534063975016275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,1,8,power_law_1.2,3.303788757324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.13200000524520875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,1,8,power_law_1.2,5.378521728515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,power_law_1.01,39.855859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.1315392017364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.13498879671096803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,1,8,power_law_1.2,8.779539489746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.13603199720382692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,1,8,power_law_1.2,13.684019470214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.1561535954475403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.19160959720611573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,1,8,power_law_1.2,14.344345092773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.14877439737319947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.17163519859313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,1,8,power_law_1.2,17.520358276367187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.19333759546279908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,1,8,power_law_1.2,0.12702720165252684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.16535040140151977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,1,8,power_law_1.2,26.092941284179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,1,8,power_law_1.2,0.127455997467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.1915519952774048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,balanced,0.1491146683692932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,1,8,power_law_1.2,0.12767360210418702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,1,8,power_law_1.2,0.2021631956100464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,1,8,power_law_1.2,0.1308351993560791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,balanced,0.12174933155377705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.2540479898452759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,1,8,power_law_1.2,0.13257600069046022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,1,8,power_law_1.2,0.31763200759887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,1,8,power_law_1.2,60.4158447265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,1,8,power_law_1.2,0.14995839595794677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,balanced,0.23363200823465982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,1,8,power_law_1.2,0.3746880054473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,1,8,power_law_1.2,0.17900799512863158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,balanced,0.22984000047047934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,1,8,power_law_1.2,0.3107968091964722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,1,8,power_law_1.2,0.21397120952606202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,1,8,power_law_1.2,0.4586751937866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,balanced,0.22454933325449625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,1,8,power_law_1.2,0.20400640964508057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,0.4442304134368896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,0.7162816047668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,balanced,0.22504534324010214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,1,8,power_law_1.2,0.21629440784454346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,balanced,0.22669333219528198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,0.8353599548339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,balanced,0.2275200088818868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,1.2667584419250488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,1,8,power_law_1.2,0.17842559814453124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,balanced,0.2341973384221395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,1.7535680770874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,1,8,power_law_1.2,0.1909824013710022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,balanced,0.23864533503850302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,2.475347137451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,1,8,power_law_1.2,0.2452672004699707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,balanced,0.23996265729268393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,3.4694271087646484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,1,8,power_law_1.2,0.2996288061141968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,balanced,0.24310932556788126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,5.294598388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,balanced,0.24569066365559897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,balanced,0.2564319968223572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,7.01812515258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,1,8,power_law_1.2,0.2940671920776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,balanced,0.2715733249982198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,balanced,0.273525337378184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,1,8,power_law_1.2,8.167648315429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,1,8,power_law_1.2,0.3260479927062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,balanced,0.27356799443562824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,1,8,power_law_1.2,0.4256896018981934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,balanced,0.32314666112263996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,1,8,power_law_1.2,14.065023803710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,balanced,0.30185600121816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,balanced,0.09215999643007915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,1,8,power_law_1.2,0.5474815845489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,balanced,0.4339199860890706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,balanced,0.08346666892369588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.2,0.7184512138366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,balanced,0.13221333424250284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,balanced,0.4812320073445638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,1,8,power_law_1.2,26.514834594726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,balanced,0.13546666502952576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.2,1.2449983596801757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,balanced,0.6874667008717855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,balanced,0.1339466671148936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,balanced,0.1357493301232656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.2,1.4232576370239258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,balanced,0.8067146937052408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,balanced,0.13638933499654135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.2,2.458367919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,balanced,0.13782933354377747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,balanced,0.13776533802350363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.2,2.3599424362182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,balanced,1.2030666669209797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,balanced,0.14378666877746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,balanced,0.14056533575057983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,balanced,0.14198933045069376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,balanced,1.587813377380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.2,4.0891777038574215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,balanced,0.14826666315396628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,balanced,0.0839466651280721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,balanced,0.14797332882881165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.2,3.9649280548095702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,balanced,0.16411200165748596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,balanced,0.07550399998823802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,balanced,2.4384427070617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,balanced,0.16618133584658304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.2,7.684754943847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,balanced,0.1665173371632894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,balanced,0.12429333726565044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,balanced,0.1930560072263082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,balanced,0.12818132837613425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,balanced,0.20085332791010538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.2,9.845734405517579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,balanced,0.1285813351472219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,balanced,3.568661371866862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,balanced,0.280623992284139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,balanced,0.13040533661842346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,1,8,power_law_1.2,12.254713439941407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,balanced,0.31755733489990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,balanced,0.13242666920026144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,balanced,0.43989332516988117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,balanced,0.13286399841308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,1,8,power_law_1.2,20.848857116699218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,balanced,0.5342559814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,balanced,4.399077415466309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,balanced,0.7904799779256185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,balanced,1.0023039976755779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,1,8,power_law_1.2,40.377297973632814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,balanced,0.13268799583117166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,balanced,0.13403200109799704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,balanced,1.4988853136698406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,balanced,7.4933013916015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.01,0.11493120193481446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.01,0.2095168113708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.01,0.13169280290603638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,balanced,1.9442453384399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.01,0.13182719945907592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.01,0.18148479461669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.01,0.1674239993095398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.01,0.13456640243530274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.01,0.22535040378570556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,balanced,2.4428319931030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.01,0.1329856038093567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,balanced,0.13788800438245138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.01,0.22459518909454346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.01,0.13638399839401244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.01,0.23916161060333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,balanced,0.1400213340918223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.01,0.1472640037536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.01,0.24469759464263915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,balanced,14.204580942789713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,balanced,0.1423786679903666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.01,0.2510783910751343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.01,0.14495359659194945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,balanced,4.405317306518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.01,0.2585472106933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,balanced,0.14526933431625366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.01,0.15716480016708373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.01,0.2637824058532715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.01,0.15306240320205688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.01,0.27511680126190186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.01,0.1571903944015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.01,0.29690239429473875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.01,0.1686784029006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.01,0.1843840003013611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.01,0.3215487957000732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,balanced,0.1569813291231791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.01,0.2165247917175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.01,0.3329792022705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,balanced,0.16074666380882263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.01,0.25189120769500734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.01,0.3569279909133911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,balanced,0.16597867012023926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.01,0.2894464015960693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,power_law_1.01,0.10655360221862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.01,0.38314878940582275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,balanced,8.051712036132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,balanced,0.21223467588424683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.01,0.30665600299835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.01,0.37512319087982177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,power_law_1.01,0.11507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,balanced,0.22472532590230307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.01,0.40590081214904783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.01,0.5994304180145263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,power_law_1.01,0.12398079633712769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,balanced,0.32185065746307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.01,0.35365118980407717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,power_law_1.01,0.11857279539108276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.01,0.5606336116790771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,balanced,0.4211680094401042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.01,0.43831682205200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,power_law_1.01,0.12893439531326295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.01,0.796288013458252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.01,0.5753407955169678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,power_law_1.01,0.15505919456481934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.01,1.186355209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,power_law_1.01,0.15614720582962036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.01,0.9467840194702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.01,1.534182357788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,power_law_1.01,0.1686336040496826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.01,1.277945613861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.01,2.0132543563842775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,balanced,0.6352213223775228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.01,1.7236352920532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.01,3.6111167907714843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.01,2.8620607376098635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,balanced,0.8599627017974854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,power_law_1.01,0.15693440437316894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.01,4.070240020751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,power_law_1.01,0.17775360345840455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.01,4.02279052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.01,6.721465301513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,balanced,1.309162696202596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.01,5.522137451171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.01,7.912601470947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,power_law_1.01,0.1595199942588806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,balanced,1.7238772710164387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.01,5.87336311340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.01,10.052703857421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,power_law_1.01,0.18336639404296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.01,10.837107086181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,power_law_1.01,0.18434560298919678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,balanced,2.568186601003011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.01,16.286029052734374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,power_law_1.01,0.22008960247039794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,4,power_law_1.2,0.22942719459533692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.01,21.969842529296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,power_law_1.01,0.2133375883102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,4,power_law_1.2,0.2014143943786621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,balanced,3.429621378580729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,power_law_1.01,0.2171776056289673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,4,power_law_1.2,0.20793600082397462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.01,43.576596069335935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,power_law_1.01,0.2774784088134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,4,power_law_1.2,0.22585599422454833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,power_law_1.01,0.39661440849304197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,balanced,4.286527951558431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,4,power_law_1.2,0.22421119213104249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,power_law_1.01,0.5304255962371827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,4,power_law_1.2,0.23276159763336182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,power_law_1.01,0.8545984268188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,4,power_law_1.2,0.249017596244812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,power_law_1.01,1.0580479621887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,4,power_law_1.2,0.25013759136199953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,balanced,6.931360244750977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,4,power_law_1.2,0.2571007966995239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,power_law_1.01,1.617363166809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,4,power_law_1.2,0.2777024030685425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,power_law_1.01,1.8941951751708985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,4,power_law_1.2,0.27946879863739016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,4,power_law_1.2,0.2842112064361572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,power_law_1.01,3.0685056686401366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,4,power_law_1.2,0.33534080982208253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,power_law_1.01,3.2732864379882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,4,power_law_1.2,0.31639680862426756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,4,power_law_1.2,0.3910207986831665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,power_law_1.01,7.309056091308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,4,power_law_1.2,0.37387518882751464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,balanced,14.448277791341146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,4,power_law_1.2,0.3931328058242798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,power_law_1.01,8.35396499633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,4,power_law_1.2,0.5451263904571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,power_law_1.01,10.30574722290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,4,power_law_1.2,0.6477888107299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,4,power_law_1.2,0.9058624267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,4,power_law_1.2,0.13343360424041747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,power_law_1.01,24.355314636230467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,4,power_law_1.2,1.032313632965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,4,power_law_1.2,0.1219648003578186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,4,power_law_1.2,1.4960448265075683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,4,power_law_1.2,0.11192320585250855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,4,power_law_1.2,0.13486080169677733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,4,power_law_1.2,2.325766372680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,4,power_law_1.2,0.13316479921340943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,4,power_law_1.2,0.13671679496765138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,power_law_1.01,40.514251708984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,4,power_law_1.2,3.6094913482666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,4,power_law_1.2,0.15960320234298705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,4,power_law_1.2,0.14839680194854737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,4,power_law_1.2,3.498444747924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,4,power_law_1.2,0.14920320510864257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,4,power_law_1.2,0.1647487998008728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,4,power_law_1.2,5.216928100585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,4,power_law_1.2,0.15912959575653077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,4,power_law_1.2,0.17384320497512817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,4,power_law_1.2,8.60271987915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,4,power_law_1.2,0.18215680122375488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,4,power_law_1.2,0.11882239580154419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,4,power_law_1.2,0.20166399478912353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,4,power_law_1.2,12.841107177734376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,4,power_law_1.2,0.2734783887863159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,4,power_law_1.2,0.1260607957839966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,4,power_law_1.2,0.2774847984313965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,4,power_law_1.2,0.12584960460662842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,4,power_law_1.2,0.3426176071166992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,4,power_law_1.2,22.681805419921876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,4,power_law_1.2,0.12942080497741698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,balanced,0.09177600344022115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,4,power_law_1.2,0.4400767803192139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,4,power_law_1.2,0.36728320121765134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,4,power_law_1.2,0.13020800352096557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,balanced,0.12402666608492534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,4,power_law_1.2,0.4635903835296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,4,power_law_1.2,0.1461824059486389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,4,power_law_1.2,0.5918208122253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,balanced,0.21985065937042236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,4,power_law_1.2,0.15478399991989136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,4,power_law_1.2,0.9378047943115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,4,power_law_1.2,45.30760192871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,balanced,0.22219733397165933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,4,power_law_1.2,1.2601344108581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,4,power_law_1.2,0.17647360563278197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,balanced,0.2217280069986979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,4,power_law_1.2,2.2259199142456056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,balanced,0.22242132822672525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,4,power_law_1.2,2.63504638671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,balanced,0.22381333510080972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,4,power_law_1.2,0.1678655982017517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,4,power_law_1.2,4.960467147827148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,balanced,0.22632533311843872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,4,power_law_1.2,0.18658560514450073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,4,power_law_1.2,6.579161834716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,balanced,0.22917866706848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,4,power_law_1.2,7.502861022949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,balanced,0.23004267613093057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,4,power_law_1.2,0.1637887954711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,balanced,0.23611734310785928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,4,power_law_1.2,11.877510070800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,4,power_law_1.2,0.1764672040939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,balanced,0.23864533503850302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,4,power_law_1.2,0.19039360284805298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,balanced,0.2399253249168396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,4,power_law_1.2,22.564102172851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,4,power_law_1.2,0.2065216064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,balanced,0.2518986662228902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,balanced,0.26057066520055133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,4,power_law_1.2,0.216428804397583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,balanced,0.2609013319015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,4,power_law_1.2,0.24931840896606444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,balanced,0.2827039957046509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,4,power_law_1.2,0.31383678913116453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,balanced,0.31090132395426434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,4,power_law_1.2,0.4768511772155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,balanced,0.3254133264223735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,balanced,0.421066681543986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,4,power_law_1.2,0.5971263885498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,balanced,0.055674667159716286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,balanced,0.4790613253911336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,4,power_law_1.2,1.076748752593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,balanced,0.07962133487065633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,balanced,0.6870293617248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,4,power_law_1.2,1.3134464263916015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,balanced,0.12846400340398154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,balanced,0.8596426645914713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,balanced,0.13133866588274637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,balanced,0.1322879989941915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,4,power_law_1.2,1.9181568145751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,balanced,1.2621546586354573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,balanced,0.13359999656677246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,4,power_law_1.2,2.653568077087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,balanced,0.13487466176350912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,balanced,0.13546666502952576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,balanced,1.6327093442281086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,4,power_law_1.2,2.922643280029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,balanced,0.13732266426086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,balanced,0.13834666212399802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,4,power_law_1.2,5.596582412719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,balanced,0.14085333546002707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,balanced,0.05467733244101206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,balanced,2.4521279335021973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,balanced,0.1420799990495046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,4,power_law_1.2,6.640480041503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,balanced,0.14455999930699667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,balanced,0.07422400017579396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,balanced,0.15254933635393778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,balanced,0.1227946678797404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,balanced,0.16114667057991028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,4,power_law_1.2,10.72533721923828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,balanced,0.1653439998626709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,balanced,3.473818778991699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,balanced,0.1264906624952952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,balanced,0.17866667111714682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,4,power_law_1.2,9.962598419189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,balanced,0.12668800354003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,balanced,0.2019466757774353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,balanced,0.12847466270128885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,balanced,0.2141866683959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,balanced,0.13115732868512472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,balanced,4.315888086954753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.01,0.11311999559402466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,balanced,0.27854933341344196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,4,power_law_1.2,25.40558776855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,balanced,0.13065600395202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,balanced,0.31706132491429645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.01,0.1457856059074402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.01,0.16826879978179932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,balanced,0.4502986669540405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.01,0.2130176067352295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,balanced,0.5710506836573283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.01,0.22082560062408446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,balanced,6.475823720296224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,balanced,0.13333866993586221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.01,0.22447359561920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,4,power_law_1.2,58.66658325195313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,balanced,0.8212479750315348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.01,0.23420159816741942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,balanced,0.13487466176350912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,balanced,1.1132960319519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.01,0.23495039939880372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.01,0.2521087884902954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,balanced,1.6252214113871257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.01,0.2511552095413208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.01,0.26338560581207277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.01,0.2867455959320068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,balanced,2.1829706827799478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.01,0.31134719848632814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,balanced,12.977269490559896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,balanced,0.14006933569908142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.01,0.2876863956451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,balanced,0.14289599657058716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.01,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,balanced,2.6976747512817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.01,0.31198720932006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,balanced,0.14641066392262778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.01,0.0796992003917694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,balanced,0.15068800250689188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.01,0.31589760780334475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.01,0.10046720504760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.01,0.3643903970718384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.01,0.13096319437026976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.01,0.42797441482543946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,balanced,4.176650683085124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.01,0.13141759634017944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.01,0.5182208061218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,balanced,0.16454399625460306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.01,0.1336832046508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.01,0.6030144214630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,balanced,0.16859199603398642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.01,0.7517055988311767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,balanced,0.17780800660451254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.01,0.1393280029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.01,1.0432000160217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,balanced,0.2304906646410624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.01,0.14253439903259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.01,1.365708827972412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,balanced,0.2450559933980306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.01,0.13868800401687623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,power_law_1.01,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.01,1.7154943466186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,balanced,8.163824081420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.01,0.14691200256347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,power_law_1.01,0.08414080142974853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.01,2.8213504791259765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.01,0.1546496033668518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,power_law_1.01,0.08572160005569458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.01,0.15340800285339357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.01,3.9375038146972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,balanced,0.35658665498097736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,power_law_1.01,0.12611839771270753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.01,0.18356479406356813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,power_law_1.01,0.12683520317077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.01,5.72113265991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,balanced,0.48519468307495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.01,0.1952831983566284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,power_law_1.01,0.13392640352249147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.01,5.65973129272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.01,0.20310399532318116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,balanced,0.7367306550343832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,power_law_1.01,0.13827199935913087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.01,0.22070400714874266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.01,9.520941162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,power_law_1.01,0.1518720030784607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,balanced,0.9785866737365723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.01,0.28263039588928224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.01,0.2902911901473999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,balanced,1.4652160008748372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.01,21.63304901123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.01,0.36732161045074463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,power_law_1.01,0.156876802444458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,2,power_law_1.2,0.13419519662857055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,balanced,1.9280053774515789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.01,0.46314239501953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,2,power_law_1.2,0.1343168020248413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,power_law_1.01,0.16017919778823853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,2,power_law_1.2,0.15641599893569946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.01,0.6724287986755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,2,power_law_1.2,0.2133631944656372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,2,power_law_1.2,0.22085120677947997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.01,0.854969596862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,balanced,2.8826611836751304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,power_law_1.01,0.15356160402297975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,2,power_law_1.2,0.22607998847961425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.01,1.2726400375366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,2,power_law_1.2,0.23331840038299562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,power_law_1.01,0.15660159587860106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,2,power_law_1.2,0.23523199558258057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.01,1.73187198638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,power_law_1.01,0.17089920043945311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,2,power_law_1.2,0.24775679111480714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,balanced,3.832325299580892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.01,2.4909055709838865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,2,power_law_1.2,0.24871680736541749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,power_law_1.01,0.1915711998939514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,2,power_law_1.2,0.2736959934234619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.01,3.422515106201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,2,power_law_1.2,0.2764607906341553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,power_law_1.01,0.19531519412994386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.01,4.326752090454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,2,power_law_1.2,0.3001919984817505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,balanced,4.806885401407878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,2,power_law_1.2,0.2900799989700317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,power_law_1.01,0.2082495927810669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,2,power_law_1.2,0.30628480911254885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.01,6.684774780273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,power_law_1.01,0.23363199234008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,2,power_law_1.2,0.3228480100631714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,2,power_law_1.2,0.3726975917816162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,power_law_1.01,0.31642239093780516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.01,11.826419067382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,2,power_law_1.2,0.42142720222473146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,power_law_1.01,0.3434880018234253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,2,power_law_1.2,0.5031040191650391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,balanced,7.755434672037761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,2,power_law_1.2,0.5583295822143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,power_law_1.01,0.5040575981140136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,2,power_law_1.2,0.739244794845581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,power_law_1.01,0.7885119915008545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,2,power_law_1.2,0.9979776382446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,power_law_1.01,1.154636764526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,2,power_law_1.2,1.6286399841308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,2,power_law_1.2,2.2141632080078124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,power_law_1.01,1.4949055671691895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,2,power_law_1.2,2.9468671798706056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,power_law_1.01,2.4040576934814455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,2,power_law_1.2,4.335782241821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,power_law_1.01,2.8888832092285157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,2,power_law_1.2,6.1007232666015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,balanced,16.127727508544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,power_law_1.01,4.80516471862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,2,power_law_1.2,7.39658203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,power_law_1.01,5.921030426025391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,2,power_law_1.2,10.112793731689454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,power_law_1.01,8.204544067382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,2,power_law_1.2,22.825363159179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,power_law_1.01,11.117241668701173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,2,power_law_1.2,0.06045439839363098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,2,power_law_1.2,0.07516800165176392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,power_law_1.01,25.488429260253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,2,power_law_1.2,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,2,power_law_1.2,0.13337600231170654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,2,power_law_1.2,0.13320319652557372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,2,power_law_1.2,0.13595520257949828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,2,power_law_1.2,0.1422592043876648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,2,power_law_1.2,0.13972480297088624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,2,power_law_1.2,0.14791680574417115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,2,power_law_1.2,0.146943998336792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,2,power_law_1.2,0.08318079710006714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,2,power_law_1.2,0.14790400266647338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,2,power_law_1.2,0.0914687991142273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,2,power_law_1.2,0.15667840242385864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,2,power_law_1.2,0.09134719967842102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,2,power_law_1.2,0.126310396194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,2,power_law_1.2,0.16209919452667237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,balanced,0.08901333808898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,2,power_law_1.2,0.12709120512008668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,2,power_law_1.2,0.18729599714279174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,2,power_law_1.2,0.13467520475387573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,balanced,0.12295466661453247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,2,power_law_1.2,0.1475711941719055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,2,power_law_1.2,0.2032383918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,balanced,0.2181333303451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,2,power_law_1.2,0.15958399772644044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,2,power_law_1.2,0.20257279872894288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,balanced,0.21960532665252686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,balanced,0.22089600563049316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,2,power_law_1.2,0.2304896116256714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,2,power_law_1.2,0.1540992021560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,balanced,0.22178133328755698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,2,power_law_1.2,0.278112006187439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,balanced,0.2239733338356018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,2,power_law_1.2,0.15444480180740355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,2,power_law_1.2,0.3021120071411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,balanced,0.22542399168014526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,2,power_law_1.2,0.4110527992248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,balanced,0.2312693397204081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,balanced,0.2336533268292745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,2,power_law_1.2,0.4743360042572021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,2,power_law_1.2,0.15441279411315917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,balanced,0.24175467093785605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,2,power_law_1.2,0.6582848072052002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,2,power_law_1.2,0.16257920265197753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,balanced,0.24110400676727295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,2,power_law_1.2,0.9170623779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,2,power_law_1.2,0.16737279891967774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,balanced,0.24302399158477783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,2,power_law_1.2,1.300979232788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,2,power_law_1.2,0.1993664026260376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,balanced,0.25702933470408124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,2,power_law_1.2,1.7478271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,balanced,0.262992004553477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,2,power_law_1.2,0.1923840045928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,2,power_law_1.2,2.952921676635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,balanced,0.2674986720085144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,2,power_law_1.2,0.2029695987701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,balanced,0.28495999177296955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,2,power_law_1.2,3.9264511108398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,2,power_law_1.2,0.23867518901824952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,balanced,0.058821335434913635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,balanced,0.32948267459869385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,2,power_law_1.2,4.22410888671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,2,power_law_1.2,0.29977600574493407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,balanced,0.33154133955637616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,2,power_law_1.2,0.3962687969207764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,2,power_law_1.2,6.15557746887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,balanced,0.08015466729799907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,balanced,0.43294934431711835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,2,power_law_1.2,0.5721280097961425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,balanced,0.5077066818873087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,balanced,0.12769599755605063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,2,power_law_1.2,14.063845825195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,2,power_law_1.2,0.8581055641174317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,balanced,0.7132746378580729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,balanced,0.13124266266822815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,2,power_law_1.2,1.0971391677856446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,balanced,0.1318986713886261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,balanced,0.9243146578470866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,2,power_law_1.2,1.4079744338989257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,balanced,0.13375999530156454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,2,power_law_1.2,2.631782341003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,balanced,1.383855978647868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,balanced,0.1351040005683899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,2,power_law_1.2,3.1428287506103514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,balanced,0.1361120045185089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,balanced,1.9934666951497395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,2,power_law_1.2,5.063379287719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,balanced,0.13710400462150574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,2,power_law_1.2,5.692038345336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,balanced,0.13914133111635843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,balanced,2.910623868306478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,2,power_law_1.2,7.623334503173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,balanced,0.14101333419481912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,balanced,0.14461333552996317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,2,power_law_1.2,13.21966094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,balanced,3.713856061299642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,balanced,0.1474666694800059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,balanced,0.055359999338785805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,balanced,0.15493333339691162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,balanced,0.07521066566308339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,2,power_law_1.2,30.481414794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,balanced,0.16481600205103555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,balanced,0.12262399991353352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,balanced,4.6201066970825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,balanced,0.1662986675898234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,balanced,0.1269439955552419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,balanced,0.18413333098093668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,balanced,0.1274773379166921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,balanced,0.2108959952990214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,balanced,0.1306880017121633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,balanced,0.23242133855819702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,balanced,0.13368533054987589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,balanced,6.948389053344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,balanced,0.31357866525650024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.0591808021068573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.08784000277519226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,balanced,0.1344000001748403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,balanced,0.37012799580891925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.07346559762954712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.10577919483184814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.07333760261535645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,balanced,0.5206400156021118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.12702080011367797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.21910400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.1236415982246399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,balanced,0.6565653483072916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.21013760566711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.13054720163345337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,balanced,0.13860266407330832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.22564480304718018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.13309439420700073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,balanced,0.14070933063824972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,balanced,0.9607840379079183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.22664320468902588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.13422720432281493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,balanced,15.486031850179037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.2302464008331299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,balanced,1.247541348139445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.138374400138855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.24119679927825927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.1394368052482605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.256499195098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,power_law_1.01,0.05447040200233459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,balanced,1.8125227292378743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.13999359607696532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.24650239944458008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,power_law_1.01,0.06871680021286011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.1457856059074402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.24561920166015624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,power_law_1.01,0.0698751986026764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.14547200202941896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,balanced,0.1461120049158732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.25657598972320556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,power_law_1.01,0.1259071946144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,balanced,2.40993595123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.15159679651260377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,balanced,0.15108266472816467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.29499518871307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,power_law_1.01,0.12485120296478272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.17885440587997437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,balanced,0.15530666708946228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.297107195854187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,power_law_1.01,0.135481595993042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.18785279989242554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,balanced,0.16296533743540445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.3058687925338745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,power_law_1.01,0.1404031991958618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,balanced,3.046127955118815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.18825600147247315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.35600640773773196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,balanced,0.18045334021250406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,power_law_1.01,0.1474943995475769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.21687040328979493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.3877120018005371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,balanced,0.18660267194112143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.2443455934524536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.40623998641967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,balanced,0.20016000668207803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.2730943918228149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.5207808017730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,power_law_1.01,0.14515199661254882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,balanced,0.2685760060946147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.6373695850372314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.3436095952987671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,power_law_1.01,0.15436160564422607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,balanced,4.686234792073567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.855072021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,balanced,0.30959467093149823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,0.40972161293029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,0.5601856231689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.01,1.059539222717285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,balanced,0.4477599859237671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,power_law_1.01,0.15031039714813232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,0.6955455780029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.01,1.507801628112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,balanced,0.5912319819132487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,power_law_1.01,0.15819519758224487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,1.0018752098083497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.01,2.0121408462524415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,power_law_1.01,0.1630911946296692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,balanced,0.8843519687652588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,1.2819583892822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.01,3.00130558013916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,power_law_1.01,0.18067840337753296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,balanced,1.1676106452941895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,1.811564826965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.01,3.964313507080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,power_law_1.01,0.19283839464187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,power_law_1.01,0.2052544116973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,2.4865535736083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,balanced,1.7476906776428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.01,4.933504104614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,balanced,9.209749221801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,power_law_1.01,0.23793280124664307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.01,3.1540672302246096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,power_law_1.01,0.30125439167022705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.01,7.067545318603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,balanced,2.320085366566976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.01,0.36126079559326174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.01,4.660249710083008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.01,0.5203455924987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.01,15.757856750488282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,balanced,3.470458666483561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.01,9.143987274169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.01,0.6481472015380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.01,0.9365119934082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.07745280265808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.01,1.2337471961975097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.09717119932174682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,balanced,4.623253186543782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.01,1.792083168029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.12911360263824462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.01,2.3812543869018556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.21207680702209472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.21867520809173585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.01,3.5199359893798827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,balanced,5.834741592407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.2307584047317505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.01,4.680972671508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.23121919631958007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.01,5.830624008178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.2342911958694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.24572160243988037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,balanced,9.382303873697916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,power_law_1.01,9.402867126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.2610879898071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.2491071939468384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,power_law_1.01,19.094464111328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.25651841163635253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.25910398960113523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.05973759889602661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.2984639883041382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.29825921058654786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.0632960021495819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.07922559976577759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.30349440574645997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.12945280075073243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.35525760650634763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,balanced,19.1473388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.12836480140686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.40132479667663573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.13269120454788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.1374079942703247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.41500158309936525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.13745280504226684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.5337984085083007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.13976320028305053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.14039679765701293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.6584383964538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.1446463942527771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.8824319839477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.14991359710693358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,1,power_law_1.2,1.0993791580200196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.1518720030784607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.17460479736328124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,1,power_law_1.2,1.545356845855713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.18209279775619508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.18654719591140748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,1,power_law_1.2,2.123788833618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.21836159229278565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,1,power_law_1.2,3.0733375549316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.245414400100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.25896320343017576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,1,power_law_1.2,3.9281665802001955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,0.35469439029693606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,0.4045567989349365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,1,power_law_1.2,4.965721511840821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,0.5635263919830322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,0.7089727878570556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,1,power_law_1.2,7.090067291259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,0.9933440208435058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,1.2682880401611327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,1,power_law_1.2,16.080569458007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,1.8292608261108398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,1,power_law_1.2,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,2.5060224533081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,1,power_law_1.2,0.06844800114631652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,1,power_law_1.2,3.1492671966552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,1,power_law_1.2,0.07411839962005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,1,power_law_1.2,4.6615550994873045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,1,power_law_1.2,0.11882239580154419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,1,power_law_1.2,9.007571411132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,1,power_law_1.2,0.12524160146713256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,1,power_law_1.2,0.13423999547958373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,1,power_law_1.2,0.13972480297088624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,1,power_law_1.2,0.14468480348587037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,1,power_law_1.2,0.14381439685821534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,1,power_law_1.2,0.15167360305786132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,1,power_law_1.2,0.1560639977455139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,1,power_law_1.2,0.16004480123519899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,1,power_law_1.2,0.1575744032859802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,1,power_law_1.2,0.18384000062942504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,1,power_law_1.2,0.19425920248031617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,1,power_law_1.2,0.20266239643096923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,1,power_law_1.2,0.23054718971252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,1,power_law_1.2,0.29795839786529543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.2,0.3689471960067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.2,0.5109632015228271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.2,0.6607999801635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.2,0.9351743698120117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.2,1.2181119918823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.2,1.8074495315551757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.2,2.3707008361816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.2,3.508710479736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.2,4.685222244262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.2,5.8596351623535154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,balanced,0.08101333181063335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,1,power_law_1.2,9.282125091552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,balanced,0.1016533374786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,balanced,0.15119999647140503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,1,power_law_1.2,18.813868713378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,balanced,0.27457600831985474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,balanced,0.49489065011342365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,balanced,0.9508000214894613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,balanced,0.0609493354956309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,balanced,0.9528693358103434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,balanced,0.07225599884986877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,balanced,0.9565973281860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,balanced,0.0988159974416097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,balanced,0.16074666380882263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,balanced,0.9581440289815267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,balanced,0.27451733748118085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,balanced,0.9566453297932943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,balanced,0.5026293198267618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,balanced,0.5026559829711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,balanced,0.945904016494751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,balanced,0.5037866830825806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,balanced,0.5048960049947103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,balanced,0.947551965713501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,balanced,0.5081813335418701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.01,0.28492159843444825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,balanced,0.5121013323465983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,balanced,0.9518400033315023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,balanced,0.5125066836675009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,balanced,0.9535253047943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,balanced,0.5208266576131185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.01,0.49025278091430663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,balanced,0.05898133416970571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,balanced,0.5237866640090942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,balanced,0.9618079662322998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,balanced,0.07193600138028462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,balanced,0.5334453185399374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.01,0.2251584053039551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,balanced,0.9647146860758463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,balanced,0.10986133416493733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,balanced,0.5380906661351522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,balanced,0.18017599980036417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,balanced,0.547813336054484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,balanced,0.9746080239613851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.01,0.2725311994552612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,balanced,0.566645344098409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,balanced,0.2762666742006938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.01,0.38068480491638185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.15770879983901978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,balanced,0.4932639996210734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,balanced,1.0171573162078857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,balanced,0.5875786542892456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,balanced,0.4957280158996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.01,0.5078527927398682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.01,0.2681472063064575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,balanced,0.6190239985783895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,balanced,1.0477279822031658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,balanced,0.49755199750264484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.01,0.11121280193328857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.01,0.6807616233825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,balanced,0.6635253429412842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,balanced,1.071397304534912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,balanced,0.5010879834493002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.01,0.1500480055809021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.01,0.7927231788635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,balanced,0.5012906789779663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.01,0.2390592098236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,balanced,0.7196213404337565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.01,0.7574719905853271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,balanced,1.127616008122762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,balanced,0.5060106515884399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.01,0.29374721050262453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.01,0.7848127841949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,balanced,0.5088853438695272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.01,0.3870527982711792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,balanced,0.7916746934254965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,balanced,1.177722692489624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,balanced,0.5140213171641032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.01,0.8005696296691894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.01,0.4150144100189209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,balanced,0.520085334777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.01,0.7771455764770507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.01,0.43143677711486816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,balanced,0.5315146843592325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,balanced,1.230453332265218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,balanced,0.9990346431732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.01,0.8276864051818847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,balanced,0.5379840135574341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.01,0.41721601486206056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.01,0.865561580657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,balanced,0.550981322924296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.01,0.4509888172149658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.01,0.860927963256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.01,0.4418303966522217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,balanced,1.4672692616780598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.01,0.958182430267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.01,0.4550784111022949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,balanced,1.148085355758667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.01,0.9506175994873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.01,0.5085631847381592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.01,1.0556096076965331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.01,0.5283328056335449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,balanced,0.5792266527811686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,balanced,1.5710293451944988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.01,1.1327679634094239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.01,0.5451839923858642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.01,0.5313856124877929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.01,1.2863615989685058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,balanced,1.5391093889872234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.01,0.6173247814178466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,0.619379186630249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,8,power_law_1.2,0.2915328025817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.01,1.2400511741638183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,0.6894976139068604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,8,power_law_1.2,0.4679296016693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,balanced,2.032778739929199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,0.7278528213500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.01,1.4780096054077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,balanced,0.6111893256505331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,8,power_law_1.2,0.19154560565948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.01,1.5919743537902833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,0.8568127632141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,8,power_law_1.2,0.26917119026184083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,power_law_1.01,0.1691648006439209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,balanced,0.664522647857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.01,2.100998306274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,0.918284797668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,8,power_law_1.2,0.380947208404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,power_law_1.01,0.2843967914581299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.01,2.4537023544311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,1.1904383659362794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,8,power_law_1.2,0.5100863933563232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,balanced,1.9279680252075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,balanced,0.7213173707326254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,power_law_1.01,0.13526400327682495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.01,3.294630432128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,1.557759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,8,power_law_1.2,0.6846975803375244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,power_law_1.01,0.1681023955345154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.01,4.4021247863769535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,2.2084415435791014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,8,power_law_1.2,0.7169856071472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,balanced,0.8394719759623209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,power_law_1.01,0.2224191904067993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,balanced,2.56276273727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.01,5.617248153686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,8,power_law_1.2,0.7227392196655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,power_law_1.01,0.2962752103805542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,2.7498111724853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,power_law_1.01,0.3823872089385986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,8,power_law_1.2,0.7788159847259521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.01,7.70738525390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,balanced,0.9418933391571045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.01,3.460076904296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,power_law_1.01,0.4286464214324951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,8,power_law_1.2,0.7759744167327881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,power_law_1.01,0.4318784236907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,8,power_law_1.2,0.8613311767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.01,4.917299270629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.01,15.160281372070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,power_law_1.01,0.4439295768737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,8,power_law_1.2,0.8558464050292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,balanced,1.3492213884989421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,balanced,2.3648746808369956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,power_law_1.01,0.45630722045898436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.01,9.852710723876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,8,power_law_1.2,0.8804608345031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,power_law_1.01,0.47292799949645997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,8,power_law_1.2,0.9367103576660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,power_law_1.01,0.4942272186279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,balanced,3.122506777445475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,8,power_law_1.2,0.9555071830749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,power_law_1.01,0.5228864192962647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,balanced,1.542741298675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,8,power_law_1.2,1.0080767631530763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,power_law_1.01,0.5400383949279786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,8,power_law_1.2,1.1516863822937011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,power_law_1.01,0.5682112216949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,power_law_1.01,0.6479680061340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,8,power_law_1.2,1.2432512283325194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,8,power_law_1.2,1.4151935577392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,power_law_1.01,0.7092160224914551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,8,power_law_1.2,1.35099515914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,balanced,2.248762607574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,8,power_law_1.2,1.6651968002319335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,8,power_law_1.2,1.8037759780883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.01,0.6768640041351318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,balanced,3.6164747873942056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,8,power_law_1.2,2.4762943267822264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.01,0.8219967842102051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.01,1.0045439720153808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,8,power_law_1.2,3.1431743621826174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.01,1.0982272148132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,balanced,4.876336097717285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,8,power_law_1.2,4.284595108032226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.01,1.4347392082214356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,balanced,2.9817492167154946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,8,power_law_1.2,5.250182342529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.01,2.012883186340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,8,power_law_1.2,6.294496154785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.01,2.720992088317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.17778559923171997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.01,3.8015487670898436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,8,power_law_1.2,0.2567231893539429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,8,power_law_1.2,9.539116668701173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,8,power_law_1.2,0.11507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.01,4.707923126220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,8,power_law_1.2,0.15323519706726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,power_law_1.01,5.519891357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,power_law_1.2,19.226284790039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,8,power_law_1.2,0.217523193359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,8,power_law_1.2,0.24367361068725585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.01,9.304128265380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,8,power_law_1.2,0.36521599292755125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,balanced,3.7020320892333984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,8,power_law_1.2,0.3937920093536377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,8,power_law_1.2,0.39647998809814455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.01,18.586329650878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,8,power_law_1.2,0.42783360481262206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,8,power_law_1.2,0.44352002143859864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,8,power_law_1.2,0.44109439849853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,8,power_law_1.2,0.5012800216674804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,8,power_law_1.2,0.4897024154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,8,power_law_1.2,0.5450111865997315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,8,power_law_1.2,0.554527997970581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,8,power_law_1.2,0.5808320045471191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,8,power_law_1.2,0.686297607421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,0.6534783840179443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,0.789574384689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,balanced,6.919877370198567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,0.8148672103881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,balanced,6.10262934366862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,0.9134143829345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,8,balanced,9.659519831339518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,1.0391807556152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,1.5594752311706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,1.6990272521972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,2.6067968368530274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,3.0151744842529298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,8,power_law_1.2,3.9530689239501955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,8,power_law_1.2,6.563129425048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,8,power_law_1.2,12.909312438964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,balanced,12.671381632486979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,balanced,0.07566933333873749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,balanced,0.1009279986222585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,balanced,0.15227199594179788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,balanced,0.27428267399470013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,balanced,0.49643198649088544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,8,power_law_1.2,0.18687360286712645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,balanced,0.9462026755015055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,balanced,0.9497120380401611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,8,power_law_1.2,0.2737344026565552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,balanced,0.9539626439412435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,8,power_law_1.2,0.09822720289230347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,balanced,0.9581066767374674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,balanced,0.9637386798858643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,8,power_law_1.2,0.16081279516220093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,balanced,0.953167994817098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,8,power_law_1.2,0.19731199741363525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,balanced,0.9594613711039225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,balanced,0.9633973439534506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,8,power_law_1.2,0.2670783996582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,balanced,0.9679413636525472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,8,power_law_1.2,0.38689279556274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,balanced,0.9769706726074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,8,power_law_1.2,0.3834944009780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,balanced,0.98417067527771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,8,power_law_1.2,0.39864320755004884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,balanced,0.9986613591512045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,8,power_law_1.2,0.40307841300964353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,balanced,1.0443893273671467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,8,power_law_1.2,0.4704768180847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,balanced,1.0785173575083415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,8,power_law_1.2,0.4755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,8,power_law_1.2,0.502348804473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,balanced,1.1137866973876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,8,power_law_1.2,0.5483136177062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,8,power_law_1.2,0.5651648044586182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,balanced,1.1957759857177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,8,power_law_1.2,0.6392127990722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,8,power_law_1.2,0.7276224136352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,balanced,1.263445297876994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,8,power_law_1.2,0.7459839820861817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,balanced,1.3476853370666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.2,0.712063980102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,balanced,1.6143466631571453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.2,0.8947967529296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.2,1.0730112075805665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,balanced,0.05779733260472616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.2,1.244326400756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,balanced,0.07285333176453908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,balanced,1.7730239232381184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.2,1.6192127227783204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,balanced,0.10081066687901814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.2,2.1768896102905275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,balanced,0.16234667102495828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.2,2.989574432373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,balanced,0.2759360074996948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,balanced,0.5051253239313761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.2,4.432883071899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,balanced,0.5060906807581583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,balanced,0.5106186469395956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.2,5.952531051635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,balanced,0.5166026751200358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,balanced,2.242234706878662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,balanced,0.5121226708094279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,8,power_law_1.2,6.614457702636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,balanced,0.5195146799087524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,balanced,0.5253706773122152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,balanced,0.5295413335164388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.2,10.592813110351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,balanced,0.535536011060079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,balanced,0.5476320187250773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,balanced,0.5509920120239258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.2,23.258099365234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,balanced,0.5644853512446085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,balanced,0.5836213429768881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,balanced,0.06800533334414165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,balanced,2.922346750895182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.01,0.10856959819793702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,balanced,0.6134933233261108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,balanced,0.07901866734027863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.01,0.15515520572662353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.01,0.17404799461364745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,balanced,0.11361599961916606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.01,0.09425920248031616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,balanced,0.6617386738459269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.01,0.26476800441741943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,balanced,0.18634132544199625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.01,0.14394240379333495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.01,0.14666880369186402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.01,0.2509759902954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,balanced,0.30905600388844806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,balanced,0.7140586376190186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.01,0.21325440406799318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.01,0.3765120029449463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,balanced,0.5119146505991617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.01,0.29136641025543214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.01,0.4679743766784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,balanced,0.5158079862594604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.01,0.7068992137908936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,balanced,0.797322670618693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.01,0.35791358947753904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.01,0.7117695808410645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,balanced,0.5196533203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.01,0.41363840103149413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.01,0.7560128211975098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,balanced,3.5314133961995444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,balanced,0.5227893193562826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.01,0.3992640018463135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.01,0.7469759941101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,balanced,0.9027360280354818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,balanced,0.5234560171763102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,balanced,0.5298453172047933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.01,0.8040063858032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.01,0.4025599956512451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,balanced,0.5371786753336588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.01,0.8371711730957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.01,0.4239039897918701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,balanced,0.5429919958114624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.01,0.848243236541748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,balanced,1.1241119702657063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.01,0.4493824005126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.01,0.8570303916931152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,balanced,0.5537973244984945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.01,0.8574336051940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.01,0.44814720153808596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,balanced,0.5672373374303182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.01,0.9070143699645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.01,0.47560958862304686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,balanced,0.5760053396224976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.01,0.9427200317382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,power_law_1.01,0.12412799596786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.01,0.5097023963928222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,balanced,0.5951840082804362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.01,1.008191967010498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,power_law_1.01,0.17303040027618408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,balanced,1.3139413197835286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.01,0.5190080165863037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.01,1.0755776405334472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,power_law_1.01,0.10207359790802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.01,1.263424015045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.01,0.5486976146697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,power_law_1.01,0.15648000240325927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.01,1.2834112167358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.01,0.5935167789459228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.01,1.4768832206726075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,power_law_1.01,0.22361600399017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.01,1.5335807800292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,balanced,0.6393386522928873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.01,0.614188814163208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,power_law_1.01,0.2786175966262817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,balanced,6.186896006266276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.01,2.0152063369750977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.01,0.7181056022644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,power_law_1.01,0.3638528108596802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.01,2.4539199829101563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,balanced,1.7766559918721516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,power_law_1.01,0.3837183952331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.01,0.7518847942352295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.01,3.256710433959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,power_law_1.01,0.4183231830596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.01,0.8743616104125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.01,4.410201644897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,power_law_1.01,0.4372992038726807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.01,1.0005887985229491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.01,4.969785690307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,power_law_1.01,0.44786558151245115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,4,power_law_1.2,0.17381759881973266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.01,1.2995712280273437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,balanced,0.7004373073577881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.01,7.85374755859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,power_law_1.01,0.48061442375183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,4,power_law_1.2,0.25428481101989747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.01,1.6351936340332032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,power_law_1.01,0.49007358551025393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,balanced,0.7916639645894369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,4,power_law_1.2,0.1413823962211609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.01,15.399591064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.01,2.187590408325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,power_law_1.01,0.5208896160125732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,balanced,2.3449920018514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,4,power_law_1.2,0.20396161079406738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,balanced,0.8678507010142008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,power_law_1.01,0.5521344184875489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.01,2.822438430786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,4,power_law_1.2,0.33254399299621584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,power_law_1.01,0.5924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,4,power_law_1.2,0.4329984188079834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.01,3.7955455780029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,balanced,1.0517600377400715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,power_law_1.01,0.6622335910797119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,4,power_law_1.2,0.6661824226379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.01,5.477881622314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,4,power_law_1.2,0.697599983215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,balanced,1.2134026686350505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,power_law_1.01,0.6987199783325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,4,power_law_1.2,0.7280320167541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.01,10.883814239501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,4,power_law_1.2,0.8020799636840821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,4,power_law_1.2,0.8051584243774415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,power_law_1.01,0.7390399932861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,balanced,1.7896000544230144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,balanced,2.81929079691569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,4,power_law_1.2,0.8048192024230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,power_law_1.01,0.8508799552917481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,power_law_1.01,1.0499711990356446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,4,power_law_1.2,0.8683712005615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,power_law_1.01,1.2659392356872559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,4,power_law_1.2,0.8434368133544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,balanced,2.1157919565836587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,power_law_1.01,1.6466175079345704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,4,power_law_1.2,0.8971199989318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,4,power_law_1.2,0.8993727684020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,power_law_1.01,2.1329727172851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,4,power_law_1.2,1.0137408256530762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,power_law_1.01,2.673747253417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,balanced,10.81491724650065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,4,power_law_1.2,1.0929408073425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,power_law_1.01,3.9094593048095705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,4,power_law_1.2,1.1549311637878419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,balanced,3.0831521352132163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,power_law_1.01,5.354624176025391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,4,power_law_1.2,1.3607423782348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,4,power_law_1.2,1.3303744316101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,power_law_1.01,6.495136260986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,4,power_law_1.2,1.5567935943603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,balanced,4.45470396677653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,4,power_law_1.2,1.7791807174682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,power_law_1.01,10.114943695068359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,4,power_law_1.2,2.3014080047607424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,4,power_law_1.2,2.7046911239624025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,balanced,4.107306798299153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,power_law_1.01,21.487942504882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,4,power_law_1.2,3.7865856170654295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,4,power_law_1.2,5.158060836791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,4,power_law_1.2,5.5402687072753904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,4,power_law_1.2,9.02877426147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,balanced,5.050058682759603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,4,power_law_1.2,16.686297607421874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,4,power_law_1.2,0.10880639553070068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,4,power_law_1.2,0.14874240159988403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,4,power_law_1.2,0.08482559919357299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,4,power_law_1.2,0.14140160083770753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,4,power_law_1.2,0.19170559644699098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,4,power_law_1.2,0.2567231893539429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,4,power_law_1.2,0.3773952007293701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,4,power_law_1.2,0.3859519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,balanced,8.296538670857748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,4,power_law_1.2,0.40200958251953123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,balanced,8.837658564249674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,4,power_law_1.2,0.3928704023361206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,4,power_law_1.2,0.43450241088867186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,4,power_law_1.2,0.44573440551757815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,4,power_law_1.2,0.4823296070098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,4,power_law_1.2,0.48490238189697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,4,power_law_1.2,0.5436160087585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,4,power_law_1.2,0.5617472171783447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,4,power_law_1.2,0.5607744216918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,4,power_law_1.2,0.6406655788421631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,4,power_law_1.2,0.6514944076538086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,4,power_law_1.2,0.7521088123321533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,4,power_law_1.2,0.8031744003295899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,4,power_law_1.2,0.9066304206848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,4,power_law_1.2,1.068006420135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,4,power_law_1.2,1.3750016212463378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,4,power_law_1.2,1.7413503646850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,4,power_law_1.2,2.555014419555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,4,power_law_1.2,3.074880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,4,power_law_1.2,3.88592643737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,4,power_law_1.2,0.12358399629592895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,4,power_law_1.2,5.7627521514892575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,4,power_law_1.2,0.1712448000907898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,balanced,16.39575958251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,4,power_law_1.2,0.09948800206184387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,4,power_law_1.2,12.037996673583985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,4,power_law_1.2,0.14280320405960084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,balanced,0.07688533266385396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,4,power_law_1.2,0.18661119937896728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,balanced,0.10319466392199199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,4,power_law_1.2,0.26024959087371824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,balanced,0.15205867091814676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,4,power_law_1.2,0.3573184013366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,balanced,0.2686186631520589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,4,power_law_1.2,0.4021632194519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,balanced,0.5045813322067261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,4,power_law_1.2,0.41603841781616213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,4,power_law_1.2,0.4224063873291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,balanced,0.9689439932505289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,4,power_law_1.2,0.46501760482788085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,balanced,0.9690666993459066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,4,power_law_1.2,0.4874559879302979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,balanced,0.9767786661783854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,4,power_law_1.2,0.48906879425048827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,balanced,0.9811200300852457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,4,power_law_1.2,0.5569215774536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,balanced,0.9844640096028646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,4,power_law_1.2,0.5713151931762696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,balanced,0.9729440212249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,balanced,0.9833013216654459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,4,power_law_1.2,0.5914624214172364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,balanced,0.9861066341400146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,4,power_law_1.2,0.6862592220306396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,balanced,0.05995733539263407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,balanced,0.9967626730600992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,balanced,0.07404266794522603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,balanced,1.0131680170694988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,4,power_law_1.2,0.7687551975250244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,balanced,0.10206400354703267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,balanced,1.0145333607991536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,balanced,0.1662453313668569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,balanced,0.2828320066134135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,balanced,1.031615972518921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,balanced,0.5197279850641886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,4,power_law_1.2,0.7661375999450684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,balanced,0.5225119988123575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,balanced,1.0794666608174641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,4,power_law_1.2,0.9313983917236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,balanced,0.5232053200403849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,4,power_law_1.2,1.0826623916625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,balanced,1.124901294708252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,balanced,0.5256640116373698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,4,power_law_1.2,1.411417579650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,balanced,0.5269706646601359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,balanced,1.1850879987080891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,4,power_law_1.2,1.6553216934204102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,balanced,0.5306133429209391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,balanced,0.5344053506851196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,4,power_law_1.2,2.2870527267456056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,balanced,1.2789599895477295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,balanced,0.5435946782430013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,4,power_law_1.2,2.8704896926879884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,balanced,0.5506133238474528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,balanced,0.5633653402328491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,balanced,1.416602611541748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,4,power_law_1.2,4.398425674438476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,balanced,0.08795199791590373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,balanced,0.5712266763051351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,balanced,0.09594133496284485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,4,power_law_1.2,6.048550415039062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,balanced,0.5883040030797323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.01,0.107750403881073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,balanced,0.12733333309491476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,balanced,1.579525311787923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,balanced,0.19821866353352866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,4,power_law_1.2,7.392530822753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,balanced,0.6205706596374512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.01,0.15425280332565308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,balanced,0.297760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.01,0.13979519605636598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,balanced,0.6759466330210367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,4,power_law_1.2,10.375750732421874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,balanced,0.5310186545054117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.01,0.20505599975585936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,balanced,1.9081279436747234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,balanced,0.5352853139241537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,balanced,0.741541306177775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.01,0.35612800121307375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,balanced,0.5410186847050985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,4,power_law_1.2,23.72443542480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,balanced,0.8126826286315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.01,0.4721343994140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,balanced,0.5440213282903036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,balanced,0.5508533318837484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.01,0.6648384094238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,balanced,2.2246665954589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,balanced,0.9566986560821533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,balanced,0.5593973398208618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.01,0.7213312149047851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,balanced,0.5683679978052775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.01,0.7402368068695069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,balanced,0.5777866840362549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.01,0.766540813446045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,balanced,1.1170612970987956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,balanced,0.5909920136133829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.01,0.8009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,balanced,0.6120160023371378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.01,0.8458239555358886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,balanced,0.629525343577067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,balanced,2.9849281311035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,balanced,1.4399040540059407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.01,0.8342975616455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,balanced,0.6697386900583903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.01,0.8755647659301757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.01,0.9209024429321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.01,0.9316736221313476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,balanced,1.795082728068034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.01,0.9592831611633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,balanced,0.7579466501871744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.01,1.0145983695983887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.01,0.07294080257415772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.01,1.1111295700073243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,balanced,3.7641706466674805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.01,1.2798527717590331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.01,0.09933440089225769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.01,0.08164479732513427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.01,1.2628864288330077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,balanced,2.5374719301859536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.01,0.12865279912948607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.01,1.4766271591186524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,balanced,0.8568426767985026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.01,0.20599679946899413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.01,1.6358207702636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.01,0.26423680782318115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,balanced,1.01145601272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.01,2.1930368423461912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.01,0.3611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.01,2.6517120361328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,balanced,1.150703986485799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.01,0.40158720016479493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.01,3.6507648468017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,balanced,4.627445220947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.01,0.40395522117614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,balanced,1.4954613049825032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,balanced,3.035264015197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.01,0.4084799766540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.01,4.51712646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.01,0.41575040817260744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.01,5.572544097900391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.01,0.4577343940734863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,balanced,1.7860639890034993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.01,0.44645118713378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.01,9.717996978759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.01,0.490828800201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.01,0.519488000869751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,balanced,2.626805305480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.01,0.5426559925079346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.01,16.461363220214842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.01,0.5668543815612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.01,0.6131455898284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,balanced,3.883397420247396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.01,0.6670591831207275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,balanced,3.232693354288737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.01,0.7645823955535889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.01,0.8197952270507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,balanced,7.349685033162435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.01,0.9883071899414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,2,power_law_1.2,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.01,1.1356863975524902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,2,power_law_1.2,0.14718719720840454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.01,1.507033634185791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,2,power_law_1.2,0.11824640035629272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,balanced,4.757354736328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,power_law_1.01,0.09987840056419373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,2,power_law_1.2,0.19752320051193237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.01,1.9330303192138671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,2,power_law_1.2,0.31468160152435304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,power_law_1.01,0.12919039726257325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.01,2.8476032257080077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,2,power_law_1.2,0.42070398330688474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,power_law_1.01,0.11177599430084229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,2,power_law_1.2,0.6151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.01,3.3994945526123046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,power_law_1.01,0.14780160188674926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,2,power_law_1.2,0.7131264209747314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,power_law_1.01,0.22199039459228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,2,power_law_1.2,0.7291391849517822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.01,4.260710525512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,2,power_law_1.2,0.7426943778991699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,balanced,5.815845489501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,power_law_1.01,0.28894720077514646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,2,power_law_1.2,0.8196991920471192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,power_law_1.01,0.3772671937942505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.01,6.789446258544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,2,power_law_1.2,0.8225791931152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,balanced,6.3350880940755205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,power_law_1.01,0.42291841506958006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,2,power_law_1.2,0.8389632225036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,power_law_1.01,0.43894400596618655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,2,power_law_1.2,0.8977151870727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.01,13.408428955078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,2,power_law_1.2,0.9447232246398926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,power_law_1.01,0.45151357650756835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,2,power_law_1.2,0.9854144096374512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,power_law_1.01,0.4724031925201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,2,power_law_1.2,1.0114239692687987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,power_law_1.01,0.4979072093963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,2,power_law_1.2,1.1079232215881347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,2,power_law_1.2,1.1794303894042968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,power_law_1.01,0.5291967868804932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,2,power_law_1.2,1.3458623886108398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,power_law_1.01,0.574124813079834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,2,power_law_1.2,1.3835904121398925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,2,power_law_1.2,1.5331904411315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,power_law_1.01,0.6219071865081787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,2,power_law_1.2,1.8249343872070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,balanced,7.83958371480306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,power_law_1.01,0.6359744071960449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,2,power_law_1.2,2.339411163330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,power_law_1.01,0.7257984161376954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,2,power_law_1.2,2.75229434967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,2,power_law_1.2,4.084358215332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,2,power_law_1.2,4.918719863891601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,power_law_1.01,0.8122112274169921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,balanced,14.441083272298178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,2,power_law_1.2,6.481139373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,power_law_1.01,0.8714943885803222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,2,power_law_1.2,9.342393493652343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,power_law_1.01,1.0768256187438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,power_law_1.01,1.3293824195861816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,2,power_law_1.2,16.963655090332033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,power_law_1.01,1.6129919052124024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,power_law_1.01,2.1014272689819338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,power_law_1.01,2.9386816024780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,balanced,12.838308970133463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,balanced,11.58627192179362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,power_law_1.01,3.7796607971191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,2,power_law_1.2,0.07681279778480529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,power_law_1.01,5.3315776824951175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,2,power_law_1.2,0.09470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,power_law_1.01,7.115155029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,2,power_law_1.2,0.08312960267066956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,2,power_law_1.2,0.12183680534362792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,power_law_1.01,8.565849304199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,2,power_law_1.2,0.1830016016960144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,2,power_law_1.2,0.24112000465393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,power_law_1.01,13.287213134765626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,2,power_law_1.2,0.36922879219055177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,2,power_law_1.2,0.38489599227905275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,power_law_1.01,27.562771606445313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,2,power_law_1.2,0.3929408073425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,2,power_law_1.2,0.42249598503112795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,2,power_law_1.2,0.43466877937316895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,2,power_law_1.2,0.4622079849243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,2,power_law_1.2,0.4689216136932373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,2,power_law_1.2,0.4973504066467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,2,power_law_1.2,0.5408319950103759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,2,power_law_1.2,0.568339204788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,2,power_law_1.2,0.5708159923553466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,2,power_law_1.2,0.6593855857849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,2,power_law_1.2,0.6938176155090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,2,power_law_1.2,0.7941247940063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,2,power_law_1.2,0.877286434173584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,balanced,26.34050750732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,2,power_law_1.2,1.038771152496338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,2,power_law_1.2,1.202073574066162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,2,power_law_1.2,1.564896011352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,2,power_law_1.2,1.9636863708496093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,2,power_law_1.2,2.797235107421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,2,power_law_1.2,3.671315383911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,2,power_law_1.2,4.575276947021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,2,power_law_1.2,7.48108139038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,2,power_law_1.2,0.09966080188751221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,2,power_law_1.2,14.145298767089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,2,power_law_1.2,0.12775039672851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,2,power_law_1.2,0.10419199466705323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,2,power_law_1.2,0.14482560157775878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,2,power_law_1.2,0.19907840490341186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,2,power_law_1.2,0.2564287900924683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,2,power_law_1.2,0.370412802696228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,2,power_law_1.2,0.4125631809234619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,2,power_law_1.2,0.42665600776672363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,2,power_law_1.2,0.4505983829498291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,balanced,0.07906133433183034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,2,power_law_1.2,0.488646411895752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,balanced,0.10380799571673076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,2,power_law_1.2,0.5083199977874756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,balanced,0.15588266650835672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,balanced,0.2718293269475301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,2,power_law_1.2,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,balanced,0.512175997098287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,2,power_law_1.2,0.5811520099639893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,balanced,0.9782666365305582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,2,power_law_1.2,0.6194111824035644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,balanced,0.9888479709625244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,2,power_law_1.2,0.6429183959960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,balanced,0.9983039697011312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,2,power_law_1.2,0.7873087882995605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,balanced,1.0137386322021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,balanced,1.0127039750417073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,balanced,0.9987839857737223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,2,power_law_1.2,0.8432512283325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,balanced,1.005343993504842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,balanced,1.0130293369293213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,balanced,0.0618453323841095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,balanced,1.013535976409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,2,power_law_1.2,0.9252991676330566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,balanced,0.07812266548474629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,balanced,1.024458646774292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,2,power_law_1.2,1.1186304092407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,balanced,0.1074773371219635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,balanced,1.0381813049316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,balanced,0.1721386710802714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,2,power_law_1.2,1.3717568397521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,balanced,0.29448533058166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,balanced,1.061018705368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,balanced,0.5371626615524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,2,power_law_1.2,1.8692352294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,balanced,0.5464160044987997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,2,power_law_1.2,2.165318489074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,balanced,1.1538293361663818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,balanced,0.553114652633667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,balanced,0.5593279997507731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,2,power_law_1.2,2.9191167831420897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.0763647973537445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,balanced,1.2325493494669597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,balanced,0.12918399771054587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,balanced,0.566757321357727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,2,power_law_1.2,3.889081573486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.10343040227890014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,balanced,0.5754719972610474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,balanced,0.13749866684277853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,balanced,1.3659626642862956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.11012480258941651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,balanced,0.5919839938481649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,balanced,0.15777599811553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,2,power_law_1.2,5.754585647583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,balanced,0.5998506546020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,balanced,0.22338666518529257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.2207360029220581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,balanced,1.496554692586263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,2,power_law_1.2,7.237088012695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,balanced,0.3461600144704183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,balanced,0.6358933448791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.3412544012069702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,balanced,0.6071093479792277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,balanced,0.6569493214289347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,balanced,1.7549386024475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.4655360221862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,2,power_law_1.2,8.783090972900391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,balanced,0.6146986484527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,balanced,0.6613173484802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.6762176036834717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,balanced,0.6247413158416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,balanced,0.6933333079020182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,2,power_law_1.2,14.004013061523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,balanced,2.0385759671529136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.7155903816223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,balanced,0.6336586475372314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,balanced,0.6388373374938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.7348991870880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,balanced,0.7299199899037679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,balanced,0.6533173322677612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.7883520126342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,balanced,0.8216266632080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,balanced,0.6702826817830404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,2,power_law_1.2,29.9047119140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,balanced,2.704287846883138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.8278464317321778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,balanced,0.6835626761118571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,balanced,0.955018679300944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.8251839637756347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,balanced,0.7232159773508707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,balanced,0.7638986905415853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.8595647811889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,balanced,1.007258653640747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,balanced,0.7982186476389567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.8893952369689941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.058374398946762086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,balanced,3.4206933975219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,balanced,0.861962636311849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.9262847900390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,balanced,1.2730240027109783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.07512320280075073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.9570367813110352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.08296319842338562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.9947327613830567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,balanced,1.5617012977600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.14464000463485718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.01,1.135155200958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,balanced,1.0150187015533447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.20903680324554444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.01,1.2344511985778808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.01,0.26987519264221194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,balanced,4.744496027628581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.01,1.457254409790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,balanced,2.14411195119222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.01,0.3861952066421509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.01,1.5172736167907714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.01,0.4213568210601807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.8381568908691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.01,0.4357312202453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.01,2.037260818481445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.01,0.4395455837249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.01,2.641856002807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.01,0.47699837684631347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,balanced,1.2455360094706218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,balanced,2.7532533009847007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.01,0.514796781539917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.01,3.242931365966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,balanced,1.550399939219157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.01,0.5333759784698486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.01,4.511219024658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.01,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,balanced,5.496896107991536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,balanced,1.7345493634541829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.01,0.6014463901519775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.01,5.9091136932373045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.01,0.6393407821655274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,balanced,2.4420533180236816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.01,7.343807983398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,power_law_1.01,0.1188480019569397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.01,0.6654335975646972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,balanced,3.9733174641927085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.01,0.7426752090454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,power_law_1.01,0.13178240060806273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.01,11.620486450195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,balanced,2.9147094090779624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,0.7993599891662597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,power_law_1.01,0.14369280338287355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,power_law_1.01,0.19585920572280885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,0.9601728439331054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.01,19.964358520507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,power_law_1.01,0.2602751970291138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,1.0257023811340331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,power_law_1.01,0.32337279319763185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,balanced,4.59386666615804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,power_law_1.01,0.4353792190551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,balanced,6.98640505472819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,1.289958381652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,power_law_1.01,0.47920641899108884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,balanced,4.732661247253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,1.5406335830688476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,power_law_1.01,0.49084157943725587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,2.0683008193969727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,power_law_1.01,0.5172160148620606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.07616639733314515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,balanced,5.675519943237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,2.6274688720703123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,power_law_1.01,0.5504576206207276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.10069119930267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,power_law_1.01,0.5711935997009278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,3.731622314453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.12050559520721435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,power_law_1.01,0.6213056087493897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,5.022169494628907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.20723199844360352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,power_law_1.01,0.68853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.3048896074295044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.01,6.1908927917480465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,power_law_1.01,0.7594240188598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,balanced,8.372959772745768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.42684159278869627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,balanced,6.048496246337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,power_law_1.01,0.8140095710754395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.01,8.75726089477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.6551871776580811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,power_law_1.01,0.9323391914367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.680940818786621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.01,16.89557800292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.7335360050201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,balanced,10.325429280598959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,power_law_1.01,1.0959551811218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.7791999816894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.7757631778717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,balanced,11.038522084554037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.8301568031311035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.01,1.2159487724304199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.852467155456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.01,1.5614080429077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.9094655990600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.01,1.915001678466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.9579008102416993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.01,2.520921516418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,1,power_law_1.2,1.0088704109191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.01,3.2054721832275392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,1,power_law_1.2,1.0279552459716796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,balanced,8.809530893961588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.01,4.5164031982421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,1,power_law_1.2,1.1594688415527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.01,5.848998260498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,balanced,13.646010080973307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,1,power_law_1.2,1.3060288429260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.01,8.452556610107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,1,power_law_1.2,1.4781760215759276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,1,power_law_1.2,1.5702400207519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.01,11.082112121582032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.8788032531738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,1,power_law_1.2,2.175462341308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.01,13.70142059326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,1,power_law_1.2,2.7276416778564454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,1,power_law_1.2,3.3870655059814454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,power_law_1.01,21.63936004638672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,1,power_law_1.2,4.593068695068359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,1,power_law_1.2,6.19343376159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,1,power_law_1.2,7.650470733642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,power_law_1.01,42.989010620117185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,1,power_law_1.2,11.65905303955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,balanced,21.564910888671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,balanced,19.80619176228841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,1,power_law_1.2,20.313824462890626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.059724801778793336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.07530239820480347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,balanced,17.87938690185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.08438400030136109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.13447680473327636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.17834880352020263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.2532671928405762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,1,power_law_1.2,0.3689471960067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,1,power_law_1.2,0.39993600845336913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,1,power_law_1.2,0.43236479759216306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,1,power_law_1.2,0.44131197929382326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,1,power_law_1.2,0.4630080223083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,1,power_law_1.2,0.5023935794830322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,1,power_law_1.2,0.5325119972229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,1,power_law_1.2,0.5717696189880371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,1,power_law_1.2,0.5945792198181152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,1,power_law_1.2,0.640831995010376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,balanced,43.78117879231771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,1,power_law_1.2,0.6673408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,1,power_law_1.2,0.75764479637146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,0.8167936325073242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,0.9756031990051269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,1.0741312026977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,1,power_law_1.2,0.11619839668273926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,1.3112768173217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,1,power_law_1.2,0.13194880485534669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,1,power_law_1.2,0.14336639642715454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,1.5796095848083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,1,power_law_1.2,0.1867583990097046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,2.1130239486694338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,1,power_law_1.2,0.23464319705963135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,2.6570688247680665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,1,power_law_1.2,0.3103424072265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,3.7899711608886717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,1,power_law_1.2,0.4335296154022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,5.047814559936524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,1,power_law_1.2,0.45788798332214353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,balanced,0.02834133307139079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,1,power_law_1.2,0.4908160209655762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,1,power_law_1.2,6.291692733764648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,balanced,0.0278613343834877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,1,power_law_1.2,0.5082880020141601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,balanced,0.03263466556866964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,1,power_law_1.2,0.5593791961669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,balanced,0.05091199775536855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,1,power_law_1.2,8.66924819946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,balanced,0.07321600119272868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,1,power_law_1.2,0.5892479896545411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,balanced,0.07207466661930084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,1,power_law_1.2,0.6330048084259033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,balanced,0.07526933153470357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,1,power_law_1.2,16.75275573730469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,1,power_law_1.2,0.7093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,balanced,0.07563733557860057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,balanced,0.07573333382606506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,1,power_law_1.2,0.7625343799591064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,balanced,0.0764213353395462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,balanced,0.07540800174077351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,1,power_law_1.2,0.8278464317321778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,balanced,0.07615466912587483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,1,power_law_1.2,0.9510144233703614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,balanced,0.07564266522725423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,balanced,0.08082133531570435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,balanced,0.08398933211962382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,balanced,0.08667733271916707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,1,power_law_1.2,1.128927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,balanced,0.0853760043780009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,balanced,0.09327999750773112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,balanced,0.10727999607721965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.2,1.2557439804077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,balanced,0.11396267016728719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.2,1.5942272186279296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,balanced,0.11930666367212932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.2,1.9421823501586915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.2,2.5614656448364257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,balanced,0.13751999537150064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.2,3.2057151794433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.2,4.523846435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,balanced,0.15660267074902853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.2,5.849606323242187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.2,8.43059844970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,balanced,0.2079306642214457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.2,11.046669006347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.2,13.67574462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,balanced,0.2338506579399109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,1,power_law_1.2,21.4891845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,balanced,0.03290133426586787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,balanced,0.3330026666323344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,balanced,0.03195200115442276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,power_law_1.01,0.04967679977416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,1,power_law_1.2,42.53972473144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,balanced,0.03366400053103765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,balanced,0.039018665750821434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,power_law_1.01,0.03952000141143799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,balanced,0.058890665570894875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,power_law_1.01,0.036800000071525577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,power_law_1.01,0.039750400185585025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,power_law_1.01,0.0455808013677597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,balanced,0.06081599990526835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,power_law_1.01,0.05241600275039673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,balanced,0.061530664563179016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,power_law_1.01,0.06501759886741638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,balanced,0.06086933116118113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,power_law_1.01,0.03416320085525513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,power_law_1.01,0.07184640169143677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,balanced,0.026416001220544178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,balanced,0.06140799820423126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,power_law_1.01,0.07195519804954528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,balanced,0.41978132724761963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,power_law_1.01,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,balanced,0.06176533301671346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,power_law_1.01,0.07275519967079162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,balanced,0.02809600035349528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,power_law_1.01,0.047366398572921756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,power_law_1.01,0.07486720085144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,balanced,0.06241600215435028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,balanced,0.02962133288383484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,power_law_1.01,0.07973120212554932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,power_law_1.01,0.05869439840316772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,balanced,0.06260799864927928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,balanced,0.03398933261632919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,power_law_1.01,0.08288639783859253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,power_law_1.01,0.057004797458648684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,balanced,0.05295466880003611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,balanced,0.06379733482996623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,power_law_1.01,0.08229759931564332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,power_law_1.01,0.059487998485565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,balanced,0.054698665936787925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,power_law_1.01,0.08700799942016602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,balanced,0.05489600201447805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,power_law_1.01,0.09366400241851806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,balanced,0.07029866675535838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,power_law_1.01,0.06033920049667359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,balanced,0.05465066432952881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,power_law_1.01,0.09601920247077941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,balanced,0.07016533116499583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,power_law_1.01,0.06102399826049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,balanced,0.05573866764704386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,power_law_1.01,0.10319360494613647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,power_law_1.01,0.06190720200538635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,balanced,0.5298240184783936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,balanced,0.05622933308283488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,balanced,0.07326933244864146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,power_law_1.01,0.11800320148468017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,balanced,0.056976000467936196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,power_law_1.01,0.12700799703598023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,power_law_1.01,0.06245120167732239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,balanced,0.07805333534876506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,balanced,0.05823466678460439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,power_law_1.01,0.1362496018409729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,power_law_1.01,0.06353279948234558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,balanced,0.0598826656738917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,balanced,0.08425600330034892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,power_law_1.01,0.165555202960968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,power_law_1.01,0.06636160016059875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,balanced,0.060821334520975746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,power_law_1.01,0.21984000205993653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,power_law_1.01,0.07189120054244995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,balanced,0.09303999940554301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,power_law_1.01,0.21783039569854737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,power_law_1.01,0.07645440101623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,power_law_1.01,0.31340799331665037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,balanced,0.10035199920336406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,power_law_1.01,0.07745280265808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,power_law_1.01,0.38137600421905515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,power_law_1.01,0.09045760035514831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,balanced,0.06658666829268138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,power_law_1.01,0.5586304187774658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,power_law_1.01,0.0991487979888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,balanced,0.12890133261680603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,balanced,0.06683200101057689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,power_law_1.01,0.6599616050720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,power_law_1.01,0.11561599969863892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,power_law_1.01,0.8476096153259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,power_law_1.01,0.1296704053878784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,balanced,0.14749866724014282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,power_law_1.01,1.327500820159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,power_law_1.01,0.17709439992904663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,power_law_1.01,2.770809555053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,power_law_1.01,0.20067200660705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,balanced,0.8089173634847006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,power_law_1.01,0.29217278957366943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,power_law_1.01,0.02940160036087036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,balanced,0.19988799095153809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,balanced,0.07133333384990692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,power_law_1.01,0.3633471965789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,power_law_1.01,0.031071999669075014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,power_law_1.01,0.03699199855327606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,power_law_1.01,0.5060351848602295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,balanced,0.07943999767303467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,power_law_1.01,0.041171199083328246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,power_law_1.01,0.6300096035003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,balanced,0.08262399832407634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,balanced,0.2464746634165446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,power_law_1.01,0.05229439735412598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,power_law_1.01,0.8705535888671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,power_law_1.01,0.052243202924728394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,power_law_1.01,1.475430393218994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,power_law_1.01,0.05398399829864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,balanced,0.10107733805974324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,power_law_1.01,2.5118080139160157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,power_law_1.01,0.05756160020828247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,balanced,0.11197333534558614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,power_law_1.01,0.058739197254180905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,balanced,0.3524426619211833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,power_law_1.01,0.06133120059967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,balanced,0.1508799990018209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,power_law_1.01,0.06407679915428162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,power_law_1.01,0.06812800168991089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,balanced,0.17760533094406128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,power_law_1.01,0.07420160174369812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,balanced,0.4443519910176595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,power_law_1.01,0.07671679854393006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,8,power_law_1.2,0.05013759732246399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,8,power_law_1.2,0.03329919874668121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,power_law_1.01,0.07921280264854431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,8,power_law_1.2,0.0354559987783432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,balanced,0.25964800516764325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,power_law_1.01,0.09150720238685608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,8,power_law_1.2,0.044556799530982974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,power_law_1.01,0.10929919481277466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,8,power_law_1.2,0.04620159864425659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,8,power_law_1.2,0.06698880195617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,8,power_law_1.2,0.07060480117797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,power_law_1.01,0.1320896029472351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,balanced,1.5410292943318684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,8,power_law_1.2,0.07475839853286743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,power_law_1.01,0.15867520570755006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,balanced,0.33981335163116455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,8,power_law_1.2,0.07394559979438782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,power_law_1.01,0.2072767972946167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,balanced,0.5557013352711996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,8,power_law_1.2,0.07555199861526489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,power_law_1.01,0.2694272041320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,8,power_law_1.2,0.08072320222854615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,8,power_law_1.2,0.08190720081329346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,power_law_1.01,0.3912384033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,8,power_law_1.2,0.08291839957237243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,power_law_1.01,0.5933119773864746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,8,power_law_1.2,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,power_law_1.01,0.7706624031066894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,balanced,0.49851731459299725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,8,power_law_1.2,0.09722880125045777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,power_law_1.01,1.113260841369629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,8,power_law_1.2,0.09573760032653808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,8,power_law_1.2,0.10889600515365601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,power_law_1.01,1.4171072006225587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,8,power_law_1.2,0.11961599588394164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,power_law_1.01,2.3565120697021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,8,power_law_1.2,0.13730560541152953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,8,power_law_1.2,0.14621440172195435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,power_law_1.01,4.024044799804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,8,power_law_1.2,0.1852671980857849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,balanced,0.65611732006073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,8,power_law_1.2,0.23868799209594727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,balanced,0.845749298731486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,8,power_law_1.2,0.2264319896697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,8,power_law_1.2,0.3496448040008545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,8,power_law_1.2,0.4157567977905273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,8,power_law_1.2,0.702016019821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,8,power_law_1.2,0.8335616111755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,8,power_law_1.2,1.0838144302368165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,8,power_law_1.2,1.7178176879882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,8,power_law_1.2,4.963724899291992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,balanced,0.8131360212961832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,8,power_law_1.2,0.040089601278305055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,8,power_law_1.2,0.03383040130138397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,8,power_law_1.2,0.03322240114212036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,8,power_law_1.2,0.039577600359916684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,8,power_law_1.2,0.04356479942798615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,8,power_law_1.2,0.05653759837150574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,8,power_law_1.2,0.05953279733657837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,8,power_law_1.2,0.060153597593307497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,8,power_law_1.2,0.05947520136833191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,8,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,8,power_law_1.2,0.06272640228271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,balanced,1.2752959728240967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,8,power_law_1.2,0.06272000074386597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,8,power_law_1.2,0.06663039922714234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,8,power_law_1.2,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,8,power_law_1.2,0.07505279779434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,8,power_law_1.2,0.07592319846153259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,balanced,1.620698610941569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,8,power_law_1.2,0.08261119723320007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,8,power_law_1.2,0.09221760034561158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,8,power_law_1.2,0.10700800418853759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,8,power_law_1.2,0.125164794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,8,power_law_1.2,0.14216320514678954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,8,power_law_1.2,0.20322558879852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,8,power_law_1.2,0.23752961158752442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,8,power_law_1.2,0.3181119918823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,8,power_law_1.2,0.031219199299812317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,8,power_law_1.2,0.3964927911758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,8,power_law_1.2,0.029760000109672547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,8,power_law_1.2,0.7467135906219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,8,power_law_1.2,0.03281919956207276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,8,power_law_1.2,0.8033663749694824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,8,power_law_1.2,0.03625600039958954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,8,power_law_1.2,1.0742527961730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,8,power_law_1.2,0.03919360041618347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,8,power_law_1.2,0.05247359871864319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,8,power_law_1.2,1.8852415084838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,8,power_law_1.2,0.05503360033035278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,8,power_law_1.2,3.8599998474121096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,8,power_law_1.2,0.0551360011100769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,8,power_law_1.2,0.056006401777267456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,8,power_law_1.2,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,8,power_law_1.2,0.06074879765510559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,8,power_law_1.2,0.062003201246261595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,balanced,0.02477866659561793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,balanced,2.5124853452046714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,8,power_law_1.2,0.06453760266304016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,balanced,0.026288000245889027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,8,power_law_1.2,0.06930559873580933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,balanced,0.03458133339881897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,balanced,0.04757333298524221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,8,power_law_1.2,0.07817599773406983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,balanced,0.0765119989713033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,8,power_law_1.2,0.0818880021572113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,balanced,0.07530666887760162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,balanced,0.07718400160471599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,balanced,0.07790933549404144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,8,power_law_1.2,0.08507519960403442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,balanced,0.07566933333873749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,8,power_law_1.2,0.10176000595092774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,balanced,0.07603199779987335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,8,power_law_1.2,0.12455040216445923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,balanced,0.0794293334086736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,balanced,0.031983998914559685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,balanced,0.08072000245253245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,8,power_law_1.2,0.14086400270462035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,balanced,0.03092266619205475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,balanced,0.08212799827257793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,balanced,0.03229333211978277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,8,power_law_1.2,0.18651520013809203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,balanced,0.04025600105524063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,balanced,0.08411199847857158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,balanced,0.060229331254959106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,8,power_law_1.2,0.24917759895324706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,balanced,0.08911466598510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,balanced,0.06205333272616068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,8,power_law_1.2,0.3596287965774536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,balanced,0.061621333161989846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,balanced,0.09088533123334248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,balanced,0.061834668119748436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,balanced,0.09587732950846355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,balanced,0.06309333443641663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,8,power_law_1.2,0.5721663951873779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,balanced,0.06418666740258534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,balanced,0.10307199756304423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,balanced,0.06517333288987477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,8,power_law_1.2,0.6057792186737061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,balanced,0.06604800124963124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,balanced,0.11537599563598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,balanced,0.06850133339564006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,8,power_law_1.2,0.9874303817749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,balanced,0.07379733522733052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,balanced,0.12517866492271423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,balanced,0.07435200115044911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,8,power_law_1.2,1.4759167671203612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,balanced,0.08125866452852885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,8,power_law_1.2,1.6818111419677735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,balanced,0.13267733653386435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,balanced,0.08773866295814514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,balanced,0.09275199969609578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,8,power_law_1.2,3.14150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,balanced,0.1646453340848287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,balanced,0.10711466272672017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,8,power_law_1.2,7.559724426269531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,balanced,0.11941867073376973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,balanced,0.030906667311986286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,balanced,0.19089066982269287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,balanced,0.15416533748308817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,balanced,0.03178666780392329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,balanced,0.03303466737270355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,balanced,0.04020266731580099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,balanced,0.26420267422993976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,balanced,0.1823199987411499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,balanced,0.056277334690093994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,power_law_1.01,0.030323201417922975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,balanced,0.05778666834036509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,balanced,0.059194669127464294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,power_law_1.01,0.031167998909950256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,balanced,0.059808000922203064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,balanced,0.2564799984296163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,power_law_1.01,0.035692799091339114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,balanced,0.3137600024541219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,power_law_1.01,0.04181120097637177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,power_law_1.01,0.053439998626708986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,balanced,0.06221333146095276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,balanced,0.06341866652170818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,power_law_1.01,0.06919040083885193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,balanced,0.33429865042368573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,balanced,0.06576533118883769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,power_law_1.01,0.06884480118751526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,balanced,0.06782933572928111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,power_law_1.01,0.07269120216369629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,balanced,0.45898131529490155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,power_law_1.01,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,power_law_1.01,0.07482240200042725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,power_law_1.01,0.08097280263900757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,power_law_1.01,0.08388479948043823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,balanced,0.07637866834799449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,balanced,0.4927146832148234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,power_law_1.01,0.08127359747886657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,balanced,0.07718400160471599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,power_law_1.01,0.08740479946136474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,power_law_1.01,0.09214720129966736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,power_law_1.01,0.09702399969100953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,balanced,0.578933318456014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,power_law_1.01,0.10138880014419556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,power_law_1.01,0.12159359455108643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,power_law_1.01,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,power_law_1.01,0.13208320140838622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,power_law_1.01,0.03208320140838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,power_law_1.01,0.14991999864578248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,balanced,0.08490133285522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,power_law_1.01,0.03340800106525421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,balanced,0.6421813170115153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,power_law_1.01,0.16531840562820435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,power_law_1.01,0.04036479890346527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,balanced,0.0983679989973704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,power_law_1.01,0.2034048080444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,power_law_1.01,0.043321600556373595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,power_law_1.01,0.2331775903701782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,power_law_1.01,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,balanced,0.10407466689745586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,power_law_1.01,0.3266815900802612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,power_law_1.01,0.059443199634552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,power_law_1.01,0.0606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,power_law_1.01,0.4474175930023193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,power_law_1.01,0.06135680079460144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,power_law_1.01,0.5561791896820069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,balanced,0.7225120067596436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,power_law_1.01,0.061299198865890504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,power_law_1.01,0.7440832138061524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,power_law_1.01,0.06406400203704835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,balanced,0.13050132989883423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,power_law_1.01,0.8494336128234863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,power_law_1.01,0.06693120002746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,power_law_1.01,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,power_law_1.01,1.4198399543762208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,balanced,0.14711466431617737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,balanced,0.7966933250427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,power_law_1.01,0.07010560035705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,power_law_1.01,0.07736319899559022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,power_law_1.01,2.7508672714233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,power_law_1.01,0.07811840176582337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,balanced,0.22365866104761759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,power_law_1.01,0.08390399813652039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,power_law_1.01,0.0932096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,power_law_1.01,0.1055232048034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,balanced,0.2772960066795349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,power_law_1.01,0.12879999876022338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,power_law_1.01,0.1484544038772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,power_law_1.01,0.19127039909362792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,power_law_1.01,0.22741119861602782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,balanced,0.39828264713287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,power_law_1.01,0.30616960525512693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,power_law_1.01,0.4259456157684326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,balanced,1.0833813349405925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,power_law_1.01,0.5608511924743652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,4,power_law_1.2,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,power_law_1.01,0.7805376052856445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,power_law_1.01,0.03223679959774017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,balanced,0.5155359903971354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,4,power_law_1.2,0.02895359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,balanced,1.2358400026957195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,power_law_1.01,0.94900484085083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,power_law_1.01,0.0332863986492157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,4,power_law_1.2,0.03504000008106232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,power_law_1.01,1.676678466796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,power_law_1.01,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,4,power_law_1.2,0.040608000755310056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,power_law_1.01,0.040320000052452086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,4,power_law_1.2,0.049439999461174014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,power_law_1.01,3.3712448120117187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,power_law_1.01,0.04248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,4,power_law_1.2,0.06593279838562012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,power_law_1.01,0.05576320290565491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,4,power_law_1.2,0.07278720140457154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,power_law_1.01,0.05658239722251892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,balanced,0.7620533307393392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,4,power_law_1.2,0.07628160119056701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,power_law_1.01,0.05862399935722351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,4,power_law_1.2,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,power_law_1.01,0.06072319746017456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,4,power_law_1.2,0.0793727993965149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,power_law_1.01,0.06139519810676575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,power_law_1.01,0.0633408010005951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,4,power_law_1.2,0.08145920038223267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,power_law_1.01,0.06794880032539367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,4,power_law_1.2,0.08085119724273682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,power_law_1.01,0.07156479954719544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,4,power_law_1.2,0.08423680067062378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,power_law_1.01,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,balanced,1.00326935450236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,4,power_law_1.2,0.08668799996376038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,4,power_law_1.2,0.0920639991760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,4,power_law_1.2,0.09667199850082397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,power_law_1.01,0.08440960049629212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,4,power_law_1.2,0.10665600299835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,power_law_1.01,0.08976640105247498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,4,power_law_1.2,0.12528640031814575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,4,power_law_1.2,0.13341439962387086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,4,power_law_1.2,0.15736960172653197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,power_law_1.01,0.0930239975452423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,4,power_law_1.2,0.17927039861679078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,4,power_law_1.2,0.22768640518188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,power_law_1.01,0.11388800144195557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,balanced,2.127290725708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,4,power_law_1.2,0.24749441146850587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,power_law_1.01,0.12356480360031127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,balanced,1.2451999982198079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,4,power_law_1.2,0.3640448093414307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,balanced,2.3310133616129556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,power_law_1.01,0.15463039875030518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,4,power_law_1.2,0.47603840827941896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,power_law_1.01,0.19916800260543824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,4,power_law_1.2,0.6243904113769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,4,power_law_1.2,0.03558399975299835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,power_law_1.01,0.27618560791015623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,4,power_law_1.2,0.8785152435302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,4,power_law_1.2,0.03173120021820068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,power_law_1.01,0.3634047985076904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,4,power_law_1.2,1.2076416015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,4,power_law_1.2,0.033164799213409424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,power_law_1.01,0.5424255847930908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,4,power_law_1.2,1.8108671188354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,4,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,power_law_1.01,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,4,power_law_1.2,0.04316799938678741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,power_law_1.01,1.0783679962158204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,4,power_law_1.2,3.953113555908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,4,power_law_1.2,0.05864959955215454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,power_law_1.01,1.347231960296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,4,power_law_1.2,0.05974400043487549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,power_law_1.01,1.50316162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,4,power_law_1.2,0.05964159965515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,4,power_law_1.2,0.062067198753356936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,power_law_1.01,2.662713623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,4,power_law_1.2,0.061868798732757566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,balanced,1.9534826278686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,4,power_law_1.2,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,power_law_1.01,5.6162879943847654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,4,power_law_1.2,0.06751999855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,4,power_law_1.2,0.0683135986328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,4,power_law_1.2,0.06974719762802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,4,power_law_1.2,0.07827839851379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,4,power_law_1.2,0.08112639784812928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,4,power_law_1.2,0.08605440258979798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,4,power_law_1.2,0.09811840057373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,4,power_law_1.2,0.106387197971344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,4,power_law_1.2,0.13122559785842897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,4,power_law_1.2,0.14639999866485595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,4,power_law_1.2,0.19920639991760253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,4,power_law_1.2,0.24113280773162843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,4,power_law_1.2,0.3324671983718872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,4,power_law_1.2,0.4219776153564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,4,power_law_1.2,0.7320064067840576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,4,power_law_1.2,0.945849609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,4,power_law_1.2,1.0487296104431152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,4,power_law_1.2,1.8532543182373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,4,power_law_1.2,3.9716991424560546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,balanced,3.838085174560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,4,power_law_1.2,0.03209599852561951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,4,power_law_1.2,0.032492798566818235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,4,power_law_1.2,0.03370879888534546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,4,power_law_1.2,0.03866879940032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,4,power_law_1.2,0.04186240136623383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,4,power_law_1.2,0.05671679973602295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,4,power_law_1.2,0.05756160020828247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,4,power_law_1.2,0.058764797449111936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,4,power_law_1.2,0.06147199869155884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,4,power_law_1.2,0.06286720037460328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,4,power_law_1.2,0.0662015974521637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,4,power_law_1.2,0.06863359808921814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,4,power_law_1.2,0.07211520075798035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,balanced,0.02566933383544286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,4,power_law_1.2,0.07672960162162781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,balanced,0.027530667682488758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,balanced,0.03156800071398417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,4,power_law_1.2,0.08352000117301941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,balanced,0.050554667909940086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,4,power_law_1.2,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,balanced,0.076773335536321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,balanced,0.07997333506743114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,balanced,0.0806879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,4,power_law_1.2,0.0943231999874115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,balanced,0.07993066807587941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,balanced,0.08124800026416779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,4,power_law_1.2,0.11750400066375732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,balanced,0.08116800089677174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,4,power_law_1.2,0.1253119945526123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,balanced,0.0832479993502299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,balanced,0.08447999755541484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,4,power_law_1.2,0.15865600109100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,balanced,0.08615466952323914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,4,power_law_1.2,0.20994560718536376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,balanced,0.08774933218955994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,4,power_law_1.2,0.3166975975036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,balanced,0.09473066528638203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,4,power_law_1.2,0.4111616134643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,4,power_law_1.2,0.5860095977783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,balanced,0.10018133123715718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,4,power_law_1.2,0.7608704090118408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,balanced,0.10582933823267619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,4,power_law_1.2,1.151244831085205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,balanced,0.11840533216794331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,4,power_law_1.2,1.6916351318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,balanced,0.12829333543777466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,4,power_law_1.2,2.048748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,balanced,0.15414933363596597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,4,power_law_1.2,3.3372161865234373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,balanced,0.16551466782887778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,4,power_law_1.2,6.952435302734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,balanced,0.034048000971476235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,balanced,0.21547200282414755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,balanced,0.03236266722281774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,balanced,0.0348693331082662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,balanced,0.04473066826661428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,balanced,0.06423466900984447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,balanced,0.26251200834910077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,balanced,0.0664106657107671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,balanced,0.0666720022757848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,balanced,0.06603200236956279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,balanced,0.06855999926726024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,balanced,0.36353600025177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,balanced,0.0689386675755183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,balanced,0.041146665811538696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,balanced,0.06939733525117238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,power_law_1.01,0.02881920039653778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,balanced,0.07175466914971669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,balanced,0.042810668547948204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,balanced,0.07337599992752075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,power_law_1.01,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,balanced,0.043552001317342125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,power_law_1.01,0.03194240033626557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,balanced,0.07709866762161255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,balanced,0.47393067677815753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,balanced,0.050767997900644936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,power_law_1.01,0.04356479942798615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,balanced,0.08309866487979889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,balanced,0.0676746666431427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,balanced,0.08577066659927368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,power_law_1.01,0.049055999517440795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,balanced,0.07037333150704701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,power_law_1.01,0.0701632022857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,power_law_1.01,0.03656960129737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,balanced,0.07167466481526692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,balanced,0.09510933359464009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,power_law_1.01,0.07163519859313965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,balanced,0.0728959987560908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,balanced,0.10866133371988933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,power_law_1.01,0.03164800107479095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,balanced,0.07346666852633159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,power_law_1.01,0.07303680181503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,balanced,0.07470933099587758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,power_law_1.01,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,balanced,0.7282986640930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,balanced,0.1151626706123352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,power_law_1.01,0.0769599974155426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,balanced,0.07726933558781941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,power_law_1.01,0.04159359931945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,power_law_1.01,0.07919999957084656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,balanced,0.13900267084439596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,balanced,0.08154666423797607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,power_law_1.01,0.045664000511169436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,power_law_1.01,0.08515840172767639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,balanced,0.0835040012995402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,power_law_1.01,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,power_law_1.01,0.08966400027275086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,balanced,0.15466666221618652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,balanced,0.08658666412035625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,power_law_1.01,0.06199679970741272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,power_law_1.01,0.09635840058326721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,power_law_1.01,0.06448000073432922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,power_law_1.01,0.09468160271644592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,balanced,0.2153706749280294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,power_law_1.01,0.06628479957580566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,power_law_1.01,0.0997759997844696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,power_law_1.01,0.06760960221290588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,balanced,0.9280320008595785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,power_law_1.01,0.1030784010887146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,balanced,0.09886933366457622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,power_law_1.01,0.07027199864387512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,balanced,0.2629653414090474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,power_law_1.01,0.12061439752578736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,power_law_1.01,0.07552000284194946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,balanced,0.10011200110117595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,power_law_1.01,0.1318336009979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,power_law_1.01,0.07837439775466919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,power_law_1.01,0.14074239730834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,power_law_1.01,0.08156160116195679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,power_law_1.01,0.17969919443130494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,balanced,0.37936532497406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,power_law_1.01,0.0896448016166687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,power_law_1.01,0.18256640434265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,power_law_1.01,0.09439359903335572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,power_law_1.01,0.24078719615936278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,power_law_1.01,0.10255359411239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,balanced,0.11585600177447002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,power_law_1.01,0.28646399974823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,power_law_1.01,0.11914240121841431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,power_law_1.01,0.39061119556427004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,balanced,0.1386293371518453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,power_law_1.01,0.13409919738769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,balanced,0.5147519906361898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,balanced,1.1436853408813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,power_law_1.01,0.4830848217010498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,power_law_1.01,0.15602560043334962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,balanced,0.14702399571736655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,power_law_1.01,0.7635392189025879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,power_law_1.01,0.1869696021080017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,power_law_1.01,0.2440256118774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,power_law_1.01,0.9787839889526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,power_law_1.01,0.2950079917907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,power_law_1.01,1.243398380279541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,balanced,0.20712000131607056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,power_law_1.01,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,power_law_1.01,1.908768081665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,balanced,0.793077309926351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,2,power_law_1.2,0.02781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,power_law_1.01,0.5838399887084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,balanced,0.2571679949760437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,power_law_1.01,0.8308159828186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,2,power_law_1.2,0.02812800109386444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,power_law_1.01,4.227865600585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,2,power_law_1.2,0.030323201417922975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,power_law_1.01,1.0759167671203613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,2,power_law_1.2,0.04111360013484955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,power_law_1.01,0.038489601016044615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,balanced,0.37959468364715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,power_law_1.01,1.4265536308288573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,2,power_law_1.2,0.04827519953250885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,power_law_1.01,0.0418368011713028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,2,power_law_1.2,0.06766080260276794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,power_law_1.01,2.256780815124512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,power_law_1.01,0.04457600116729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,2,power_law_1.2,0.07236480116844177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,2,power_law_1.2,0.07438719868659974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,balanced,0.45953067143758136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,power_law_1.01,0.049344000220298764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,power_law_1.01,4.546105575561524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,2,power_law_1.2,0.08014079928398132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,balanced,1.0518559614817302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,power_law_1.01,0.05299199819564819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,balanced,1.8125759760538738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,2,power_law_1.2,0.08302720189094544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,power_law_1.01,0.06510720252990723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,2,power_law_1.2,0.08791040182113648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,2,power_law_1.2,0.09464319944381713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,power_law_1.01,0.0682752013206482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,balanced,0.6706079641977946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,2,power_law_1.2,0.10474239587783814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,power_law_1.01,0.07079039812088013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,2,power_law_1.2,0.09441919922828675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,2,power_law_1.2,0.10059520006179809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,power_law_1.01,0.0720255970954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,2,power_law_1.2,0.10452480316162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,power_law_1.01,0.07486079931259156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,2,power_law_1.2,0.12314879894256592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,power_law_1.01,0.08084480166435241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,2,power_law_1.2,0.13505280017852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,balanced,0.8768959840138754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,2,power_law_1.2,0.1447872042655945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,power_law_1.01,0.085452800989151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,2,power_law_1.2,0.17193599939346313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,power_law_1.01,0.08869119882583618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,2,power_law_1.2,0.1865664005279541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,balanced,1.3129226366678874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,power_law_1.01,0.09653760194778442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,2,power_law_1.2,0.24321279525756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,2,power_law_1.2,0.2931648015975952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,2,power_law_1.2,0.3926912069320679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,power_law_1.01,0.10741759538650512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,2,power_law_1.2,0.5558464050292968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,power_law_1.01,0.11509120464324951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,balanced,1.2987199624379475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,2,power_law_1.2,0.810086441040039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,2,power_law_1.2,1.1043392181396485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,2,power_law_1.2,1.3921536445617675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,power_law_1.01,0.12273279428482056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,2,power_law_1.2,2.1219072341918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,power_law_1.01,0.1455296039581299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,power_law_1.01,0.1827008008956909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,power_law_1.2,4.5604095458984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,power_law_1.01,0.24033279418945314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,balanced,1.7160320281982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,power_law_1.01,0.29562880992889407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,power_law_1.01,0.4204415798187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,balanced,2.072709401448568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,power_law_1.01,0.5239999771118165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,power_law_1.01,0.7550208091735839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,power_law_1.01,0.9894783973693848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,2,power_law_1.2,0.03668479919433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,2,balanced,3.3285013834635415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,power_law_1.01,1.475820827484131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,2,power_law_1.2,0.03187200129032135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,power_law_1.01,1.950035285949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,2,power_law_1.2,0.035872000455856326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,2,power_law_1.2,0.041094401478767396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,power_law_1.01,2.453971290588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,balanced,2.1362133026123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,2,power_law_1.2,0.043961599469184875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,2,power_law_1.2,0.06239359974861145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,power_law_1.01,3.721209716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,2,power_law_1.2,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,2,power_law_1.2,0.06458240151405334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,2,power_law_1.2,0.06664959788322448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,power_law_1.01,7.612486267089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,2,power_law_1.2,0.06855679750442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,2,power_law_1.2,0.07279999852180481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,2,power_law_1.2,0.07804160118103028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,2,power_law_1.2,0.08060160279273987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,2,power_law_1.2,0.08273919820785522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,2,power_law_1.2,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,2,power_law_1.2,0.09271039962768554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,2,power_law_1.2,0.10304000377655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,2,power_law_1.2,0.11905920505523682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,2,power_law_1.2,0.13475199937820434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,2,power_law_1.2,0.1605247974395752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,2,power_law_1.2,0.18904320001602173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,2,power_law_1.2,0.2505215883255005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,balanced,3.3754612604777017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,2,power_law_1.2,0.3164736032485962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,2,power_law_1.2,0.45635199546813965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,2,power_law_1.2,0.6126143932342529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,2,power_law_1.2,0.8803071975708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,balanced,3.8687146504720054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,2,power_law_1.2,1.2458751678466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,2,power_law_1.2,1.5213631629943847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,2,power_law_1.2,2.2362239837646483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,2,power_law_1.2,4.6687744140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,balanced,6.637205123901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,balanced,0.044693330923716225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,balanced,0.05409066875775655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,balanced,0.0735999991496404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,balanced,0.12827733159065247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,2,power_law_1.2,0.03864319920539856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,balanced,0.2265333334604899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,2,power_law_1.2,0.04005120098590851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,2,power_law_1.2,0.04405759871006012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,balanced,0.22712000211079916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,2,power_law_1.2,0.04842880070209503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,2,power_law_1.2,0.052288001775741576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,balanced,0.22835199038187662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,2,power_law_1.2,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,2,power_law_1.2,0.06814720034599304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,balanced,0.22738667329152426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,2,power_law_1.2,0.0717631995677948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,balanced,0.22726933161417642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,2,power_law_1.2,0.07468159794807434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,balanced,0.22779732942581177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,2,power_law_1.2,0.07653120160102844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,balanced,0.22924800713857016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,2,power_law_1.2,0.08153600096702576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,balanced,0.23176000515619913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,2,power_law_1.2,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,balanced,0.2326293389002482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,2,power_law_1.2,0.08906239867210389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,balanced,0.23836266994476318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,2,power_law_1.2,0.09902719855308532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,balanced,0.24337599674860635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,balanced,0.2450559933980306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,2,power_law_1.2,0.10994559526443481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,balanced,0.03658666710058848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,balanced,0.25128533442815143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,2,power_law_1.2,0.11564160585403442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,balanced,0.03997333347797394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,balanced,0.2568853298823039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,balanced,0.05565333366394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,balanced,0.08376000324885051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,2,power_law_1.2,0.12300159931182861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,balanced,0.13170133034388223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,balanced,0.2706720034281413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,balanced,0.13352533181508383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,2,power_law_1.2,0.14702080488204955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,balanced,0.2828426758448283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,balanced,0.1349546710650126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,2,power_law_1.2,0.1726591944694519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,balanced,0.13552000125249228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,balanced,0.3074986735979716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,2,power_law_1.2,0.24797439575195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,balanced,0.13648533821105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,balanced,0.13665067156155905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,2,power_law_1.2,0.3187328100204468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,balanced,0.3437173366546631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,balanced,0.13863466183344522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,2,power_law_1.2,0.42598400115966795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,balanced,0.13934933145840964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,2,power_law_1.2,0.5407872200012207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,balanced,0.14099199573198953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,balanced,0.37062398592631024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,2,power_law_1.2,0.7639423847198487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,balanced,0.14338666200637817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,2,power_law_1.2,1.0438464164733887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,balanced,0.15014933546384177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.12278399467468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,2,power_law_1.2,1.524300765991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,balanced,0.15147733688354492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,balanced,0.4854400157928467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,balanced,0.031498665610949196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,balanced,0.15530133247375488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,2,power_law_1.2,2.0210432052612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.0680512011051178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,balanced,0.03576533248027166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.08044160008430482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,balanced,0.16520532965660095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,2,power_law_1.2,2.634252738952637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,balanced,0.05165866514046987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.1014143943786621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,balanced,0.07921599845091502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,balanced,0.17577600479125977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.1446336030960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,2,power_law_1.2,4.781433486938477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,balanced,0.1264479955037435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.1994047999382019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,balanced,0.6175839900970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,balanced,0.19323732455571493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,balanced,0.12846933801968893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.2120448112487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,balanced,0.1301653285821279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,2,power_law_1.2,9.607917022705077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.21173760890960694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,balanced,0.21441600720087686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,balanced,0.1297706663608551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.21714560985565184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.22369918823242188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,balanced,0.13149333000183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.23277440071105956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,balanced,0.13290666540463766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,balanced,0.2624640067418416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.23814399242401124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,balanced,0.13392000397046408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.24997758865356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,balanced,0.8610560099283854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,balanced,0.1358453333377838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.23786239624023436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,balanced,0.13943466544151306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,balanced,0.29655466477076214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.25959680080413816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,balanced,0.14171199997266135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.28312320709228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.26368639469146726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.2993920087814331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,balanced,0.40251731872558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.01,0.32433280944824217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.01,0.36960639953613283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.01,0.07891839742660522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,balanced,0.14899733662605286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.01,0.41312642097473146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.01,0.05986559987068176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,balanced,0.15065067013104758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.01,0.4891712188720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,balanced,1.1141280333201091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.01,0.5746880054473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.01,0.06279039978981019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,balanced,0.49141331513722736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.01,0.8307135581970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,power_law_1.01,0.07813760042190551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.01,0.07651200294494628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.01,0.9542783737182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.01,0.08675199747085571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,power_law_1.01,0.048153600096702574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.01,1.5003392219543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.01,0.11713279485702514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.01,1.9101823806762694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.01,0.12126719951629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,power_law_1.01,0.07326719760894776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.01,2.437107276916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,power_law_1.01,0.08924800157546997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.01,0.13431040048599244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.01,3.399020767211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,balanced,0.6978826522827148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,power_law_1.01,0.12402559518814087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.01,0.13167359828948974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,balanced,0.15996799866358438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,power_law_1.01,0.1263360023498535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.01,0.13288320302963258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.01,7.147942352294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,balanced,0.17586666345596313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,power_law_1.01,0.1295040011405945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.01,0.13573119640350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,balanced,1.3991200129191081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,power_law_1.01,0.13385599851608276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,balanced,0.18502400318781534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.01,0.14201600551605226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,power_law_1.01,0.13477760553359985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,balanced,0.2140586574872335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.01,0.14812159538269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,power_law_1.01,0.1451200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,power_law_1.01,0.1466431975364685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.01,0.14387199878692628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,balanced,0.23647467295328775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,power_law_1.01,0.15532159805297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.01,0.14675840139389038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,balanced,0.9062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,power_law_1.01,0.16273280382156372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.01,0.1666111946105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,balanced,0.3391306797663371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.01,0.164902400970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.01,0.19006719589233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,power_law_1.01,0.1752832055091858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,balanced,0.3954559961954753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.01,0.1977023959159851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,power_law_1.01,0.17921919822692872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.11726080179214478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.01,0.24176640510559083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.06136959791183472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.01,0.28275840282440184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.07584000229835511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,power_law_1.01,0.18776960372924806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.01,0.36044158935546877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,balanced,0.5672906637191772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.10254080295562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,power_law_1.01,0.21427199840545655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.01,0.4257664203643799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.1250175952911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,balanced,1.1307466824849446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.01,0.25528318881988527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,balanced,2.1615467071533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.01,0.5970304012298584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.19964799880981446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.01,0.32228479385375974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.01,0.6871168136596679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.21018240451812745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.01,0.38259201049804686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,balanced,0.7484959761301676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.22288639545440675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.01,1.0109248161315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.01,0.5518208026885987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.22322559356689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.01,1.5049728393554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.01,0.6400447845458984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.22581119537353517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.01,1.0760448455810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.01,1.7082048416137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.24299519062042235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.01,1.2342464447021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.2502079963684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.01,2.9622528076171877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,balanced,1.1112213134765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.01,1.983558464050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.2481920003890991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.2234816074371338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.01,5.670188903808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.01,2.914374351501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.2650559902191162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,power_law_1.01,3.5917823791503904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.29348480701446533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.28008959293365476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,power_law_1.01,4.740639877319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,balanced,1.7284746170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,8,power_law_1.2,0.3308288097381592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,8,power_law_1.2,0.34281599521636963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,power_law_1.01,10.079296112060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,balanced,1.4685546557108562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,8,power_law_1.2,0.4063551902770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,8,power_law_1.2,0.4561215877532959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,8,power_law_1.2,0.5117119789123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,8,power_law_1.2,0.7260863780975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,8,power_law_1.2,0.9317631721496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,8,power_law_1.2,1.432147216796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,8,power_law_1.2,1.901728057861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,8,power_law_1.2,2.256857681274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,balanced,1.818618615468343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,8,power_law_1.2,3.323334503173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,8,power_law_1.2,4.404563140869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,balanced,3.9312426249186196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,8,power_law_1.2,11.91562271118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,balanced,2.886410713195801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,balanced,3.346207936604818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.07939199805259704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.04426240026950836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.0599295973777771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.06414080262184144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.08241919875144958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.11991679668426514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.12651519775390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.13338880538940429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.13461120128631593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.13553919792175292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.13920639753341674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.14266879558563234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.15982719659805297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.14906879663467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.1689087986946106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.17285120487213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.16724480390548707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.19942400455474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.21813759803771973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.2598207950592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.32603518962860106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,0.3918400049209595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,balanced,5.723690668741862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,8,power_law_1.2,0.07370240092277527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,0.47852158546447754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,8,power_law_1.2,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,0.704640007019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,8,power_law_1.2,0.05597440004348755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,0.9299072265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,8,power_law_1.2,0.06652160286903382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,8,power_law_1.2,0.07685760259628296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,1.334348773956299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,8,power_law_1.2,0.11880320310592651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,1.7319551467895509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,8,power_law_1.2,0.12522239685058595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,8,power_law_1.2,2.326579284667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,8,power_law_1.2,0.13274240493774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,8,power_law_1.2,0.13656959533691407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,8,power_law_1.2,3.322457504272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,8,power_law_1.2,0.13404799699783326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,8,power_law_1.2,0.1478976011276245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,8,power_law_1.2,0.15075839757919313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,8,power_law_1.2,9.404768371582032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,8,power_law_1.2,0.16072959899902345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,8,power_law_1.2,0.1636672019958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,8,power_law_1.2,0.17523839473724365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,8,power_law_1.2,0.19879679679870604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,balanced,0.0396373321612676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,8,power_law_1.2,0.19696639776229857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,balanced,0.05301333467165629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,balanced,0.07937600215276082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,8,power_law_1.2,0.23111679553985595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,balanced,0.12852799892425537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,balanced,0.22830933332443237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.2,0.28961279392242434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,balanced,0.22753065824508667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.2,0.3177151918411255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,balanced,0.22873600323994955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,balanced,0.22849067052205405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.2,0.4089791774749756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,balanced,0.2289066712061564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.2,0.6032000064849854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,balanced,0.2300693392753601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.2,0.7518976211547852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,balanced,0.2318720022837321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,balanced,0.033973333736260734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.2,1.107686424255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,balanced,0.2351626753807068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.2,1.5851391792297362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,balanced,0.03670933345953623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,balanced,0.2360373338063558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.2,2.568422317504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,balanced,0.24280534187952676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,balanced,0.08364799618721008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,balanced,0.2510026693344116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.2,3.6752513885498046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,balanced,0.25271467367808026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,balanced,0.1344533363978068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,8,power_law_1.2,4.2047168731689455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,balanced,0.2600053350130717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,balanced,0.13672533631324768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,balanced,0.26945600907007855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,8,power_law_1.2,7.445766448974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,balanced,0.13893866539001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,balanced,0.2876799901326497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,balanced,0.1388746698697408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,balanced,0.13962666193644205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,8,power_law_1.2,16.301881408691408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,balanced,0.30796800057093304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,balanced,0.1402346690495809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,balanced,0.1416320006052653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,balanced,0.3336106538772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,balanced,0.14452266693115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,balanced,0.14613333344459534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,balanced,0.38446935017903644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,balanced,0.1506186624368032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.01,0.07685120105743408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,balanced,0.15638400117556253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,balanced,0.4339146614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.01,0.06556159853935242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,balanced,0.15893866618474325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.01,0.06869760155677795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,balanced,0.16742400328318277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.01,0.09548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,balanced,0.5771093368530273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.01,0.12438399791717529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,balanced,0.1800373395284017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.01,0.19442559480667115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,balanced,0.1934559941291809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,balanced,0.03578133384386698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.01,0.21352319717407225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.01,0.0546176016330719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.01,0.2188352108001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,balanced,0.22023467222849527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.01,0.04705919921398163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,balanced,0.040133332212766014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,balanced,0.6981333096822103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.01,0.21250560283660888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.01,0.050732797384262084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,balanced,0.2504426638285319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,balanced,0.05345066885153452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.01,0.22254080772399903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.01,0.07427200078964233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.01,0.23023359775543212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,balanced,0.08156266808509827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.01,0.08786560297012329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.01,0.23137919902801513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,balanced,0.1295199990272522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,balanced,0.30948267380396527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.01,0.1192896008491516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.01,0.24061439037322999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.01,0.12182400226593018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,balanced,0.13277332981427512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.01,0.24499199390411378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.01,0.12828799486160278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,balanced,0.13521599769592285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,balanced,1.0069279670715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.01,0.25931520462036134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,balanced,0.3617013295491536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.01,0.13000960350036622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,balanced,0.13581333557764688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.01,0.2582207918167114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.01,0.13119360208511352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,balanced,0.1365226705869039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.01,0.2723392009735107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.01,0.13627519607543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,balanced,0.13917866349220276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.01,0.3012480020523071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.01,0.1417407989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,balanced,0.1416159967581431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,balanced,0.49369064966837567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.01,0.3278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.01,0.14334720373153687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,balanced,0.14407466848691305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.01,0.36430718898773196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.01,0.14672000408172609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,balanced,0.14760532975196838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.01,0.4163072109222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.01,0.15877120494842528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,balanced,0.15267733732859293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.01,0.48343682289123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.01,0.16224000453948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.01,0.5893248081207275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,balanced,1.2910133202870686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,balanced,0.617301344871521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.01,0.17337599992752076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.01,0.8370304107666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.01,0.1933184027671814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.01,1.0010560035705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.01,0.21487998962402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.01,1.3524415969848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.01,0.24735360145568847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,balanced,0.16261333227157593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.01,0.3020416021347046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.01,1.9173696517944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,balanced,0.16658133268356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.01,0.3671168088912964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.01,2.307334327697754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.01,0.4589824199676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,balanced,0.8961066404978434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.01,3.5258174896240235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.01,0.6390079975128173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.01,0.7775360107421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.01,7.512012481689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,balanced,1.6180639266967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.01,1.129702377319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.01,1.4441984176635743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,balanced,0.17999466260274252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.01,1.9674112319946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,balanced,0.2023786703745524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.01,2.991155242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,balanced,1.1934026877085369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,balanced,0.2158720095952352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.01,6.357350540161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,balanced,0.2823733290036519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,balanced,0.3274506727854411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,power_law_1.01,0.0584384024143219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,power_law_1.01,0.0527616024017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,balanced,0.4778933525085449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,power_law_1.01,0.05608959794044495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,4,power_law_1.2,0.07626879811286927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,power_law_1.01,0.07146239876747132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,balanced,0.5683306852976481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,4,power_law_1.2,0.05408639907836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,balanced,1.4716639518737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,balanced,2.5076319376627603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,power_law_1.01,0.08454399704933166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,4,power_law_1.2,0.07095680236816407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,power_law_1.01,0.11936000585556031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,4,power_law_1.2,0.09619839787483216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,4,power_law_1.2,0.11131520271301269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,power_law_1.01,0.12543359994888306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,balanced,0.820192019144694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,4,power_law_1.2,0.19270399808883668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,power_law_1.01,0.13214720487594606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,4,power_law_1.2,0.21578240394592285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,power_law_1.01,0.13786239624023439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,power_law_1.01,0.14095360040664673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,4,power_law_1.2,0.2146496057510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,power_law_1.01,0.1441856026649475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,4,power_law_1.2,0.22631680965423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,power_law_1.01,0.14940799474716188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,4,power_law_1.2,0.22835841178894042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,power_law_1.01,0.1532415986061096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,balanced,1.080357313156128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,power_law_1.01,0.1692479968070984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,4,power_law_1.2,0.2361920118331909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,4,power_law_1.2,0.248473596572876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,power_law_1.01,0.17974400520324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,4,power_law_1.2,0.2529920101165771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,power_law_1.01,0.19703680276870728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,4,power_law_1.2,0.2503232002258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,4,power_law_1.2,0.2628864049911499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,balanced,2.2804746627807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,balanced,1.5959146817525227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,power_law_1.01,0.20098559856414794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,4,power_law_1.2,0.2738624095916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,power_law_1.01,0.23982079029083253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,4,power_law_1.2,0.28292479515075686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,power_law_1.01,0.27093119621276857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,4,power_law_1.2,0.31099519729614256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,power_law_1.01,0.3631808042526245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,4,power_law_1.2,0.32436480522155764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,power_law_1.01,0.45183358192443845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,4,power_law_1.2,0.3816256046295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,power_law_1.01,0.5681791782379151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,power_law_1.01,0.7408768177032471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,4,power_law_1.2,0.44266881942749026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,4,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,power_law_1.01,1.1138624191284179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,4,power_law_1.2,0.5385280132293702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,balanced,2.1085920333862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,4,power_law_1.2,0.042368000745773314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,power_law_1.01,1.4755711555480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,4,power_law_1.2,0.6184512138366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,4,power_law_1.2,0.05200639963150024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,power_law_1.01,2.1528064727783205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,4,power_law_1.2,0.8385536193847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,4,power_law_1.2,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,power_law_1.01,3.1232320785522463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,4,power_law_1.2,0.08049280047416688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,4,power_law_1.2,1.0858240127563477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,power_law_1.01,3.4386878967285157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,4,power_law_1.2,0.11742719411849975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,4,power_law_1.2,1.7666048049926757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,power_law_1.01,5.745510482788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,4,power_law_1.2,0.12576639652252197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,balanced,5.03436279296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,4,power_law_1.2,0.12985600233078004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,4,power_law_1.2,2.2964672088623046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,4,power_law_1.2,0.13147519826889037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,power_law_1.01,10.843046569824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,4,power_law_1.2,2.793049621582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,4,power_law_1.2,0.12929279804229737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,4,power_law_1.2,0.1411967992782593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,balanced,2.634559949239095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,4,power_law_1.2,4.0508544921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,4,power_law_1.2,0.14211200475692748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,4,power_law_1.2,0.15082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,4,power_law_1.2,9.279289245605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,4,power_law_1.2,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,4,power_law_1.2,0.1564095973968506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,4,power_law_1.2,0.16580480337142944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,4,power_law_1.2,0.1794816017150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,4,power_law_1.2,0.1950592041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,balanced,4.464927991231282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,4,power_law_1.2,0.23080320358276368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,4,power_law_1.2,0.27162880897521974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,4,power_law_1.2,0.32239360809326173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,4,power_law_1.2,0.4579328060150146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,4,power_law_1.2,0.531660795211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,balanced,4.165738741556804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,4,power_law_1.2,0.6782015800476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,4,power_law_1.2,0.9231424331665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,4,power_law_1.2,1.3113280296325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,4,power_law_1.2,1.657369613647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,4,power_law_1.2,2.064204788208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,4,power_law_1.2,3.838156890869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,4,power_law_1.2,7.301331329345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,4,power_law_1.2,0.059033602476119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,4,power_law_1.2,0.04046719968318939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,4,power_law_1.2,0.04867840111255646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,4,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,balanced,0.04043733328580856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,4,power_law_1.2,0.08062080144882203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,balanced,0.052560001611709595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,balanced,0.07622933387756348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,4,power_law_1.2,0.12104320526123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,balanced,0.12868799765904745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,4,power_law_1.2,0.1283519983291626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,balanced,0.22631466388702393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,4,power_law_1.2,0.1351040005683899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,4,power_law_1.2,0.13783040046691894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,balanced,0.23164266347885132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,balanced,8.271231969197592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,balanced,0.2334666649500529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,4,power_law_1.2,0.1428096055984497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,balanced,0.23095999161402384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,4,power_law_1.2,0.14539519548416138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,balanced,0.23279466231664023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,4,power_law_1.2,0.15512959957122802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,balanced,0.23462400833765665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,4,power_law_1.2,0.15259519815444947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,balanced,0.23682133356730142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,4,power_law_1.2,0.17802879810333253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,balanced,0.2405386765797933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,balanced,0.24272533257802328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,4,power_law_1.2,0.18946559429168702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,balanced,0.25118933121363324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,4,power_law_1.2,0.2045759916305542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,balanced,0.2603466709454854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,balanced,0.2643253405888875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,balanced,0.2767519950866699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,4,power_law_1.2,0.2066495895385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,balanced,0.2975626587867737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,4,power_law_1.2,0.2408895969390869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,4,power_law_1.2,0.2799488067626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,balanced,0.31544532378514606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,4,power_law_1.2,0.39957120418548586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,balanced,0.3508586486180623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,4,power_law_1.2,0.5385983943939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,4,power_law_1.2,0.723635196685791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,balanced,0.39210665225982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,4,power_law_1.2,0.816915225982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,4,power_law_1.2,1.1093695640563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,balanced,0.47951467831929523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,4,power_law_1.2,1.6967679977416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,4,power_law_1.2,2.5875007629394533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,balanced,0.5612800121307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,4,power_law_1.2,3.5815486907958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,4,power_law_1.2,3.849375915527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,4,power_law_1.2,6.993682861328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,balanced,0.7755839824676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,balanced,0.03580799947182337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,4,power_law_1.2,13.9343994140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,balanced,0.05665066838264465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,balanced,0.08536000053087871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,balanced,0.9534347057342529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,balanced,0.136053333679835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,balanced,0.13748799761136374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,balanced,0.13923199971516928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,balanced,0.1393173336982727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,balanced,0.14230933785438538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,balanced,0.14365866780281067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,balanced,0.14597866932551065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,balanced,0.14995200435320535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,balanced,1.3783307075500488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,balanced,0.15150933464368185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,balanced,0.15577600399653116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,balanced,0.04580800235271454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,balanced,0.164000004529953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,balanced,0.16925867398579916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,balanced,0.05080533524354299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.01,0.05203199982643127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,balanced,0.18223466475804648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.01,0.04530560076236725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,balanced,0.061018665631612144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,balanced,0.20392000675201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.01,0.06527360081672669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,balanced,0.08989866574605306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,balanced,0.21849066019058228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.01,0.09237120151519776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,balanced,1.8375306129455566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,balanced,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.01,0.03821440041065216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.01,0.1211583971977234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,balanced,0.2563093304634094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,balanced,0.14501333236694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.01,0.0403903990983963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.01,0.19823999404907228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,balanced,0.14806933204332987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,balanced,0.2972693244616191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.01,0.05132799744606018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.01,0.20864639282226563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,balanced,0.14909332990646362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.01,0.21369600296020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.01,0.07088639736175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,balanced,0.1520639955997467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,balanced,0.15518400073051453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,balanced,0.3994400103886922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.01,0.21535999774932862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.01,0.08350080251693726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,balanced,0.1590559979279836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.01,0.22252159118652343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.01,0.12359039783477783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,balanced,0.16528000434239706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.01,0.23316481113433837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.01,0.12743680477142333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,balanced,0.4913333257039388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,balanced,0.17060265938440958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.01,0.23742079734802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,balanced,0.1768853267033895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.01,0.13185919523239137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,balanced,2.2619199752807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.01,0.24286720752716065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.01,0.1350399971008301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.01,0.2590208053588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.01,0.13891199827194214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,balanced,0.7121919790903727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.01,0.2669440031051636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.01,0.1441151976585388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,balanced,0.19346133867899576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.01,0.15535999536514283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.01,0.2762176036834717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,balanced,0.2002399961153666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.01,0.15652480125427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.01,0.28279039859771726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.01,0.16127359867095947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,balanced,0.9117919603983561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.01,0.3119488000869751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.01,0.17420799732208253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.01,0.3383104085922241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.01,0.1804479956626892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.01,0.39290881156921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.01,0.43797760009765624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,power_law_1.01,0.04838399887084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.01,0.1901311993598938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,balanced,0.22872000932693481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.01,0.5634943962097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.01,0.21950719356536866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,power_law_1.01,0.05023360252380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,balanced,1.3314026991526287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,balanced,0.2787253260612488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.01,0.6431615829467774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.01,0.23829119205474852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,power_law_1.01,0.0607807993888855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,balanced,0.3153013388315837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.01,0.911961555480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,balanced,3.4755465189615884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.01,0.2810175895690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,power_law_1.01,0.07637760043144226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,balanced,0.4218826691309611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.01,1.1488896369934083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,power_law_1.01,0.09324799776077271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.01,0.33098878860473635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.01,1.6144319534301759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,balanced,0.4891253312428792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,power_law_1.01,0.1266111969947815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.01,0.44021759033203123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.01,2.1004287719726564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,power_law_1.01,0.13640320301055908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.01,0.5325759887695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,balanced,0.7262880007425944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,power_law_1.01,0.14229120016098024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.01,2.5267391204833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.01,0.7981632232666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,balanced,1.764693260192871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,2,power_law_1.2,0.05170559883117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,power_law_1.01,0.14795520305633544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.01,1.0199487686157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.01,3.9938304901123045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,power_law_1.01,0.14999040365219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,balanced,0.888965368270874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,2,power_law_1.2,0.044614401459693906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.01,1.3808064460754395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,2,power_law_1.2,0.06298239827156067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,power_law_1.01,0.1601472020149231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.01,8.906623840332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,2,power_law_1.2,0.0880895972251892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,power_law_1.01,0.16958080530166625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.01,1.845363235473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,2,power_law_1.2,0.10811519622802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,balanced,1.3097973664601643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,power_law_1.01,0.18029439449310303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.01,2.4827392578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,2,power_law_1.2,0.1979647994041443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,power_law_1.01,0.19614720344543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,2,power_law_1.2,0.20614399909973144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.01,3.697132873535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,2,power_law_1.2,0.22058238983154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,balanced,2.198176066080729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,power_law_1.01,0.2076927900314331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,2,power_law_1.2,0.2221695899963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,balanced,1.7287626266479492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.01,8.587615966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,power_law_1.01,0.22780799865722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,2,power_law_1.2,0.23043839931488036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,2,power_law_1.2,0.23632640838623048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,2,power_law_1.2,0.24635519981384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,power_law_1.01,0.23919999599456787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,2,power_law_1.2,0.24753921031951903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,power_law_1.01,0.30344960689544676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,2,power_law_1.2,0.24964480400085448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,balanced,2.560277303059896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,power_law_1.01,0.37445759773254395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,2,power_law_1.2,0.26844799518585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,power_law_1.01,0.47434239387512206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,2,power_law_1.2,0.2797951936721802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,power_law_1.01,0.5791039943695069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,2,power_law_1.2,0.28703999519348145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,power_law_1.01,0.8470015525817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,2,power_law_1.2,0.32115840911865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,power_law_1.01,0.9892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,balanced,6.857237497965495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,2,power_law_1.2,0.341427206993103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,power_law_1.01,1.590841579437256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,2,power_law_1.2,0.4093503952026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,balanced,3.2428372701009116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,balanced,3.379151980082194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,2,power_law_1.2,0.46229119300842286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,power_law_1.01,2.0327423095703123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,2,power_law_1.2,0.5670591831207276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,power_law_1.01,2.8671552658081056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,2,power_law_1.2,0.7665279865264892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,2,power_law_1.2,0.9494272232055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,power_law_1.01,3.8895809173583986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,2,power_law_1.2,1.2340991973876954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,power_law_1.01,4.638956832885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,2,power_law_1.2,1.746847915649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,power_law_1.01,7.56903076171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,2,power_law_1.2,2.223846435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,2,power_law_1.2,0.03918080031871796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,balanced,4.199194590250651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,2,power_law_1.2,2.795257568359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,2,power_law_1.2,0.03831680119037628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,power_law_1.01,14.924954223632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,2,power_law_1.2,4.528793716430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,2,power_law_1.2,0.050291198492050174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,2,power_law_1.2,0.06802560091018676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,2,power_law_1.2,9.428985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,2,power_law_1.2,0.07949439883232116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,2,power_law_1.2,0.1230847954750061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,2,power_law_1.2,0.12751359939575196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,2,power_law_1.2,0.1327232003211975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,2,power_law_1.2,0.13808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,2,power_law_1.2,0.13776639699935914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,2,power_law_1.2,0.1468287944793701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,2,power_law_1.2,0.1540992021560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,2,power_law_1.2,0.15856000185012817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,balanced,6.6391042073567705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,2,power_law_1.2,0.16234240531921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,balanced,6.456213633219401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,2,power_law_1.2,0.17408640384674073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,2,power_law_1.2,0.18110719919204712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,2,power_law_1.2,0.19816319942474364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,2,power_law_1.2,0.2239680051803589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,2,power_law_1.2,0.24188799858093263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,2,power_law_1.2,0.2880255937576294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,2,power_law_1.2,0.35086081027984617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,2,power_law_1.2,0.47097601890563967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,2,power_law_1.2,0.5366911888122559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,2,power_law_1.2,0.8702527999877929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,2,power_law_1.2,1.01594877243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,2,power_law_1.2,1.5125568389892579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,2,power_law_1.2,1.9709312438964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,2,power_law_1.2,2.566873550415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,2,power_law_1.2,4.490681457519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,2,power_law_1.2,8.225856018066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,balanced,13.22338612874349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,2,power_law_1.2,0.048307201266288756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,2,power_law_1.2,0.04924159944057464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,2,power_law_1.2,0.05740159749984741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,balanced,0.04196266829967499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,2,power_law_1.2,0.07255679965019227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,balanced,0.05492266515890757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,2,power_law_1.2,0.08115839958190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,balanced,0.07905066510041554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,2,power_law_1.2,0.12718720436096193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,balanced,0.1304693321386973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,2,power_law_1.2,0.1382464051246643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,balanced,0.23195199171702066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,balanced,0.2345973253250122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,2,power_law_1.2,0.14804480075836182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,balanced,0.2371573249499003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,2,power_law_1.2,0.14864640235900878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,balanced,0.2400266726811727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,2,power_law_1.2,0.1556607961654663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,balanced,0.24172266324361166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,balanced,0.24022932847340903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,2,power_law_1.2,0.16550400257110595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,balanced,0.24703466892242432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,balanced,0.25065066417058307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,2,power_law_1.2,0.17292799949645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,2,power_law_1.2,0.1835263967514038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,balanced,0.25541333357493085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,balanced,0.2669173280398051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,2,power_law_1.2,0.20417919158935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,balanced,0.28406399488449097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,balanced,0.03932266682386398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,balanced,0.2898346583048503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,balanced,0.04515199859937032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,2,power_law_1.2,0.2116863965988159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,balanced,0.3158880074818929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,balanced,0.06217066446940104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,2,power_law_1.2,0.23455359935760497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,balanced,0.09595200419425964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,balanced,0.3540000120798747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,balanced,0.15210666259129843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,balanced,0.3717706600824992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,2,power_law_1.2,0.22967679500579835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,balanced,0.15506133437156677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,2,power_law_1.2,0.2966975927352905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,balanced,0.15727999806404114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,2,power_law_1.2,0.3886656045913696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,balanced,0.43078935146331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,balanced,0.15921066204706827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,2,power_law_1.2,0.5343488216400146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,balanced,0.16139733791351318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,2,power_law_1.2,0.5772863864898682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,balanced,0.49302931626637775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,balanced,0.16339199741681418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,2,power_law_1.2,0.7975615978240966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,balanced,0.16710933049519858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,2,power_law_1.2,1.1576512336730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,balanced,0.1707520087560018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,2,power_law_1.2,1.652556800842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,balanced,0.7001386483510336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,balanced,0.17633599042892456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,2,power_law_1.2,2.1004032135009765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,balanced,0.1844480037689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,2,power_law_1.2,3.0935487747192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,balanced,0.19751467307408652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,balanced,0.8736053307851156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,balanced,0.20575465758641562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,2,power_law_1.2,3.904275131225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,balanced,0.23363200823465982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,2,power_law_1.2,5.0315711975097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.04302079975605011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,balanced,0.26735466718673706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,2,power_law_1.2,7.969427490234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,balanced,1.257530689239502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.04708479940891266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,balanced,0.28970666726430255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.0657151997089386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,balanced,0.3495146830876668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,2,power_law_1.2,17.14775695800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.09314560294151306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,balanced,0.3992053270339966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,balanced,1.5877760251363118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.11817599534988403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,balanced,0.06751466790835063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,balanced,0.5789706707000732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,balanced,0.07232533395290375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.037651199102401736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.20060160160064697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,balanced,0.08091199894746144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.04115839898586273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,balanced,0.11317333579063416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.21100161075592042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,balanced,0.7621973355611166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,balanced,0.1688800056775411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.05573760271072388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.22275199890136718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,balanced,0.17867734034856161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.07433599829673768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,balanced,2.345482667287191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,balanced,0.18105600277582803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.22650880813598634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.09214079976081849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,balanced,1.1616053581237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,balanced,0.18381333351135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.13308800458908082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.23405439853668214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,balanced,0.19057599703470865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.1417088031768799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.243174409866333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,balanced,0.19497066736221313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.14572800397872926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,balanced,0.20244799057642618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.2597120046615601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.15278719663619994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,balanced,0.21357866128285727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.15900800228118897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,balanced,1.5185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.2743680000305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,balanced,0.2222986618677775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.16556160449981688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,balanced,0.23465067148208618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.28066558837890626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.17798399925231934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,balanced,3.077434539794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.19064320325851442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.29764480590820314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.1879680037498474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.3086656093597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.204915189743042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,balanced,0.261952002843221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.22026240825653076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.3214848041534424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,balanced,0.2776479919751485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,balanced,2.261408011118571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.24381439685821532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.3829119920730591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.28849918842315675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.3899967908859253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.3202687978744507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.3793344020843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.47162880897521975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,0.4627967834472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,balanced,0.35259731610616046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,0.6156352043151856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.5362239837646484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,balanced,3.847834587097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,0.7572927951812745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,balanced,0.4434933265050252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.7016767978668212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,1.1084735870361329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,balanced,2.9822025299072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,balanced,0.49076799551645917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.8803647994995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,1.4636032104492187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,balanced,0.6877600351969401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.01,1.2740799903869628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,2.1916032791137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,power_law_1.01,0.059622400999069215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.01,1.5491071701049806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,balanced,0.81877334912618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,2.9255935668945314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,power_law_1.01,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.01,2.2523712158203124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,power_law_1.01,0.07617279887199402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.01,3.625484848022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,balanced,1.2676106293996174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,power_law_1.01,0.09200639724731445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.01,2.9326335906982424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.04296320080757141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.01,5.7533119201660154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,power_law_1.01,0.10944000482559205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.01,3.6326080322265626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,power_law_1.01,0.15385600328445434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.04780159890651703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,balanced,1.5700373649597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,power_law_1.01,0.1627519965171814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,balanced,3.717162768046061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.01,11.417964935302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,power_law_1.01,0.172160005569458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.01,6.0277759552001955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.08743680119514466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,power_law_1.01,0.18188159465789794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.108787202835083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,balanced,2.3229920069376626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,balanced,5.5695037841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,power_law_1.01,0.1907263994216919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.01,11.978495788574218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.1999935984611511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,power_law_1.01,0.20396161079406738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.2149440050125122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,power_law_1.01,0.22147839069366454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.22191359996795654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,power_law_1.01,0.2342463970184326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,balanced,3.049541473388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,power_law_1.01,0.26095359325408934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.2337536096572876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.2356031894683838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.2544640064239502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,power_law_1.01,0.27870080471038816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.263590407371521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,power_law_1.01,0.307423996925354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.27048320770263673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,balanced,4.531434694925944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,balanced,5.434858957926433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,power_law_1.01,0.3493056058883667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.2791424036026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.29575679302215574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,power_law_1.01,0.4535679817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.01,0.5398464202880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.3151808023452759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.32856318950653074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.01,0.7197887897491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.3890048027038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.01,0.8923775672912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.3973632097244263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.01,1.2539327621459961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,balanced,5.988192240397136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.47655038833618163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.01,1.6129215240478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.5424895763397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.01,2.34771842956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.7165823936462402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.01,3.088038444519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.9001472473144532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.01,4.5550590515136715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,1,power_law_1.2,1.286284828186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,1,power_law_1.2,1.6039552688598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.01,6.014771270751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,1,power_law_1.2,2.2964672088623046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.01,7.480000305175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,1,power_law_1.2,2.980544090270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,balanced,7.466117223103841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,balanced,11.386608123779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,power_law_1.01,11.858220672607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,1,power_law_1.2,3.6787391662597657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,1,power_law_1.2,6.047507095336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,power_law_1.01,23.509829711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,1,power_law_1.2,11.96319351196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,balanced,10.922096252441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.037299200892448425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.04082559943199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.052902400493621826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,balanced,11.823248545328775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.07009279727935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.08357120156288148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.13275519609451295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.14177919626235963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.15162880420684816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.1561792016029358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.16483839750289916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.1670591950416565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.18261120319366456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.1925376057624817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.1935487985610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.20967679023742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.22335999011993407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.24780800342559814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.29344000816345217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.32094080448150636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.3894912004470825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,0.463756799697876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,0.6166656017303467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,0.7661952018737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,1.1137215614318847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,1.4843711853027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,2.22542724609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,2.9396480560302733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,1,power_law_1.2,3.667782211303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,1,power_law_1.2,5.780422210693359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,1,power_law_1.2,11.460031890869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,balanced,23.517903645833332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,balanced,0.08534399668375652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,balanced,0.10620266199111938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,1,power_law_1.2,0.06093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,balanced,0.16204266746838888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,balanced,0.2950773239135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,1,power_law_1.2,0.0689791977405548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,balanced,0.528767983118693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,1,power_law_1.2,0.07553920149803162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,balanced,0.6683146953582764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,1,power_law_1.2,0.08826239705085755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,balanced,0.6670773029327393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,1,power_law_1.2,0.10648959875106812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,1,power_law_1.2,0.15210880041122438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,balanced,0.6672320365905762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,1,power_law_1.2,0.16562559604644775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,balanced,0.6713386376698812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,1,power_law_1.2,0.17724159955978394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,balanced,0.6688586870829264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,1,power_law_1.2,0.1860159993171692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,balanced,0.6706666946411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,1,power_law_1.2,0.19151359796524048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,balanced,0.6786293188730875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,1,power_law_1.2,0.20663681030273437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,balanced,0.6786293188730875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,1,power_law_1.2,0.22092161178588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,balanced,0.6851306756337484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,1,power_law_1.2,0.23709440231323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,balanced,0.6901066303253174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,1,power_law_1.2,0.2606015920639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,balanced,0.697754700978597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,balanced,0.7028693358103434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,balanced,0.746287981669108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,1,power_law_1.2,0.28485119342803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,balanced,0.739786704381307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,1,power_law_1.2,0.3117759943008423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,balanced,0.9442880153656006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,balanced,0.06055466830730438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,1,power_law_1.2,0.35199999809265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,balanced,0.8165760040283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,balanced,0.07412800192832947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,1,power_law_1.2,0.45383682250976565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,balanced,0.10595200459162395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.2,0.5418047904968262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,balanced,0.17192000150680542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,balanced,1.214687983194987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,balanced,0.2995679974555969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.2,0.7282048225402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,balanced,0.36324799060821533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.2,0.8973119735717774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,balanced,0.36582934856414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.2,1.258687973022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,balanced,0.9647040367126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,balanced,0.3662079970041911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.2,1.616499137878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,balanced,0.3670773506164551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,balanced,0.37588798999786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.2,2.3566207885742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,balanced,0.3728213310241699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.2,3.0895999908447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.01,0.2848320007324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,balanced,0.3724213441212972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,balanced,1.4825280507405598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.2,4.560550308227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,balanced,0.3803679943084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,balanced,0.3853973150253296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.2,6.015961456298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.01,0.4296895980834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,balanced,0.39722665150960285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.01,0.16650880575180055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.2,7.453887939453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,balanced,0.39584533373514813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,balanced,1.5806186993916829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,balanced,0.4057493209838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.01,0.29015679359436036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,1,power_law_1.2,11.827449798583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.17864320278167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,balanced,0.45784000555674237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.01,0.3462591886520386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,balanced,0.4349973201751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.2355072021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,balanced,0.05946666498978933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.01,0.560422420501709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,1,power_law_1.2,23.46705322265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.10059520006179809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,balanced,0.07234133283297221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,balanced,0.546832005182902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.01,0.16302080154418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.01,0.5362175941467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,balanced,0.11378133296966553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,balanced,2.311072031656901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.20494720935821534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,balanced,0.18797866503397623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.01,0.5791552066802979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,balanced,0.5074453353881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,balanced,0.28588799635569256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.01,0.28475520610809324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.01,0.6163968086242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,balanced,0.35278932253519696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.01,0.3167871952056885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,balanced,0.7770240306854248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.01,0.6326464176177978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,balanced,0.3556266625722249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.01,0.3133888006210327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.01,0.6352640151977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,balanced,0.35782400767008465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.01,0.3368832111358643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,balanced,0.35949333508809406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,balanced,0.6504106521606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.01,0.6843711853027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.01,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,balanced,0.3612693150838216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.01,0.7014527797698975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,balanced,0.3644160032272339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.01,0.3543551921844482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,balanced,0.36802132924397785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.01,0.6914432048797607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,balanced,3.669871966044108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.01,0.34703359603881834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,balanced,0.37196799119313556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.01,0.7399040222167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,balanced,0.9920480251312256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.01,0.3637952089309692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.01,0.8071488380432129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,balanced,0.3771573305130005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.01,0.3687295913696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.01,0.7754496097564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,balanced,0.3863840103149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.01,0.4038400173187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.01,0.8950464248657226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.01,0.42368640899658205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.01,0.9361472129821777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.01,0.4359871864318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.01,1.1917823791503905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,balanced,1.0842613379160564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.01,1.1639936447143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.01,0.49496960639953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.01,1.4094079971313476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,0.5062143802642822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,balanced,0.39396798610687256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.01,1.6334783554077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,0.5892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.01,2.018195152282715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,0.7636735916137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.01,2.3924800872802736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,balanced,4.108720143636067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,0.9364416122436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.01,2.9844032287597657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,balanced,1.4696426391601562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,1.0193663597106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.01,5.061183929443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,balanced,0.4083626667658488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,1.2927680015563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.01,5.96165771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,1.4781439781188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.01,9.322809600830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,2.209011268615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,2.970572853088379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.01,16.77411804199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.01,3.897126388549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,8,power_law_1.2,0.2849663972854614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,balanced,2.0289546648661294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,balanced,0.42601601282755536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.01,5.328697586059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,8,power_law_1.2,0.18595839738845826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,balanced,0.4466346502304077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,8,power_law_1.2,0.17896319627761842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,power_law_1.01,0.16844160556793214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.01,10.530169677734374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,8,power_law_1.2,0.22087678909301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,power_law_1.01,0.24647040367126466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,8,power_law_1.2,0.3137471914291382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,power_law_1.01,0.11559040546417236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,8,power_law_1.2,0.5475391864776611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,balanced,5.799946467081706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,power_law_1.01,0.1651520013809204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,8,power_law_1.2,0.5457151889801025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,power_law_1.01,0.18958719968795776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,8,power_law_1.2,0.5839231967926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,power_law_1.01,0.26845440864562986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,8,power_law_1.2,0.6234879970550538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,power_law_1.01,0.3214207887649536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,balanced,2.132362683614095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,balanced,0.4989440043767293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,8,power_law_1.2,0.5845503807067871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,power_law_1.01,0.3322688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,power_law_1.01,0.32962560653686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,8,power_law_1.2,0.6838335990905762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,balanced,0.554533322652181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,power_law_1.01,0.331328010559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,8,power_law_1.2,0.7074175834655761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,power_law_1.01,0.3660928010940552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,8,power_law_1.2,0.6953919887542724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,power_law_1.01,0.36675200462341306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,8,power_law_1.2,0.7387968063354492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,balanced,0.781925360361735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,power_law_1.01,0.39629440307617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,8,power_law_1.2,0.7771520137786865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,8,power_law_1.2,0.8560064315795899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,power_law_1.01,0.42827520370483396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,8,power_law_1.2,0.8339008331298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,balanced,0.8831360340118408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,power_law_1.01,0.4657855987548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,8,power_law_1.2,0.9552319526672364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,8,power_law_1.2,1.0254719734191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,8,power_law_1.2,1.218118381500244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,power_law_1.01,0.4453887939453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,8,power_law_1.2,1.2322688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,balanced,1.2909493446350098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,8,power_law_1.2,1.6892032623291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,8,power_law_1.2,1.8298688888549806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,power_law_1.01,0.49646720886230467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,balanced,3.610581398010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,8,power_law_1.2,2.40948486328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,8,power_law_1.2,2.6822015762329103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,balanced,1.6994880040486653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,power_law_1.01,0.5168896198272706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,8,power_law_1.2,3.6927295684814454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.01,0.5768703937530517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,8,power_law_1.2,6.567628479003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,8,power_law_1.2,7.843878173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.01,0.6947328090667725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.01,0.7966400146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,8,power_law_1.2,12.548889923095704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,balanced,2.3052639961242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.01,1.0624704360961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.01,1.3741567611694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,balanced,9.535754521687826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.01,1.841049575805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,8,power_law_1.2,27.536767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.01,2.4229440689086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.01,3.675532913208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.01,4.571750259399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,balanced,3.1042133967081704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,power_law_1.01,6.241433715820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,power_law_1.01,11.571405029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.17920000553131105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,power_law_1.01,22.107180786132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.11918079853057861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.11745920181274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,8,power_law_1.2,0.14931199550628663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,balanced,3.746986707051595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.17957119941711425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,8,power_law_1.2,0.2889919996261597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,balanced,6.6402028401692705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,8,power_law_1.2,0.32792959213256834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,8,power_law_1.2,0.3253376007080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,8,power_law_1.2,0.33861119747161866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,8,power_law_1.2,0.3427520036697388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,8,power_law_1.2,0.3437311887741089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,8,power_law_1.2,0.3621567964553833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,8,power_law_1.2,0.3845056056976318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,8,power_law_1.2,0.40052480697631837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,8,power_law_1.2,0.40369281768798826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,8,power_law_1.2,0.4414527893066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,balanced,6.025093078613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,8,power_law_1.2,0.45066242218017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,8,power_law_1.2,0.508358383178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,0.5604671955108642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,0.6477056026458741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,0.7442111968994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,0.957913589477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,1.074009609222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,1.3906559944152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,1.8478015899658202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,2.61267204284668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,3.771091079711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,8,power_law_1.2,4.610291290283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,8,power_law_1.2,0.16892800331115723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,8,power_law_1.2,0.08886399865150452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,8,power_law_1.2,7.445887756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,8,power_law_1.2,0.10130560398101807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,8,power_law_1.2,0.15869439840316774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,8,power_law_1.2,0.1844032049179077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,balanced,0.07650133470694225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,8,power_law_1.2,13.753875732421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,8,power_law_1.2,0.2892927885055542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,balanced,0.1037013332049052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,8,power_law_1.2,0.3080384016036987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,balanced,0.15787733594576517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,8,power_law_1.2,0.33327999114990237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,balanced,0.28707732756932575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,8,power_law_1.2,0.32032639980316163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,balanced,0.5293493270874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,8,power_law_1.2,0.3621376037597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,balanced,0.6666879653930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,8,power_law_1.2,0.3812927961349487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,balanced,0.6656586726506551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,8,power_law_1.2,0.3951359987258911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,balanced,0.675493319829305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,balanced,12.529120127360025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,balanced,0.6753333409627279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,8,power_law_1.2,0.43388800621032714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,balanced,0.6781546274820963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,8,power_law_1.2,0.4329728126525879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,balanced,0.6766666571299235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,8,power_law_1.2,0.46657280921936034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,balanced,0.6834719975789388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,balanced,0.6847999890645345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,balanced,0.6924906571706136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,8,power_law_1.2,0.46766080856323244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,balanced,0.700709342956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,balanced,0.7064266999562582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,8,power_law_1.2,0.5059904098510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,balanced,0.7182613213857015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,balanced,0.7448480129241943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,balanced,0.7592053413391113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,8,power_law_1.2,0.543449592590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.2,0.6322688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,balanced,1.077349344889323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,balanced,0.8533546924591064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.2,0.7520832061767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.2,0.9278464317321777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,balanced,1.2415573596954346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.2,1.2613183975219726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.2,1.4393792152404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.2,2.383251190185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,balanced,1.046506643295288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.2,2.916089630126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.2,4.309190368652343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,balanced,1.6139307022094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.2,6.0587646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,balanced,0.06055466830730438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,8,power_law_1.2,8.039641571044921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,balanced,0.07375466823577881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,balanced,0.10770666599273682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,8,power_law_1.2,12.374809265136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,balanced,0.1705120007197062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,balanced,1.732906659444173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,balanced,0.293232003847758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,balanced,0.3601706822713216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.01,0.1775488018989563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,balanced,0.36006398995717365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,8,power_law_1.2,28.049383544921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,balanced,0.36186667283376056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.01,0.253004789352417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,balanced,0.062218666076660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,balanced,0.36315735181172687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.01,0.14675840139389038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,balanced,0.3696693181991577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,balanced,0.07515199979146321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,balanced,2.281701405843099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,balanced,0.3714453379313151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,balanced,0.11431466539700826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.01,0.24897921085357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,balanced,0.17588265736897787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,balanced,0.3729439973831177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,balanced,0.29053332408269245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,balanced,0.3753439982732137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.01,0.3130880117416382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,balanced,0.3575199842453003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,balanced,0.38468265533447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,balanced,0.36141331990559894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.01,0.5506559848785401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,balanced,0.3944106499354045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,balanced,0.36396265029907227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.01,0.558080005645752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.01,0.11684479713439941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,balanced,0.3663146495819092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,balanced,0.4004533290863037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.01,0.55829758644104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,balanced,0.368938684463501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.01,0.14890240430831908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,balanced,3.035397211710612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,balanced,0.4034239848454793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,balanced,0.3743893305460612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.01,0.6062655925750733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.01,0.09054080247879029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,balanced,0.46485865116119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,balanced,0.37915201981862384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.01,0.5840320110321044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.01,0.15436160564422607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,balanced,0.3839626709620158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,balanced,0.45070401827494305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.01,0.6029503822326661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.01,0.18402559757232667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,balanced,0.3920160134633382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.01,0.6589439868927002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.01,0.29216001033782957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,balanced,0.5788160165150961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,balanced,0.4063200155893962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.01,0.3095423936843872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.01,0.6767551898956299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,balanced,0.5427999893824259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.01,0.33000319004058837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.01,0.6699647903442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.01,0.3405695915222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.01,0.7006015777587891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.01,0.3543231964111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,balanced,0.7367520332336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.01,0.702182388305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,balanced,3.337002754211426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,balanced,0.41461865107218426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.01,0.3492288112640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.01,0.7550015926361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.01,0.36470398902893064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.01,0.8428671836853028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,balanced,0.7317600250244141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.01,0.36419200897216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.01,0.8492799758911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.01,0.3758399963378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.01,0.978054428100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.01,0.39996159076690674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,balanced,0.43243734041849774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.01,1.1263551712036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.01,0.3996608018875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,balanced,1.108016014099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.01,1.3857536315917969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.01,0.42473602294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.01,1.508396816253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.01,0.516428804397583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.01,0.5077695846557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.01,1.8265472412109376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.01,0.6060031890869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.01,2.384556770324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,balanced,1.3353759447733562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.01,0.6381951808929444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.01,3.2985984802246096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.01,0.8046719551086425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,balanced,0.46215466658274335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.01,0.9928128242492675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.01,4.448979187011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,balanced,5.921194712320964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,balanced,0.5052160024642944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.01,1.191551971435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.01,5.314822387695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.01,1.499788761138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,balanced,1.7232426007588704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.01,2.334783935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.01,8.534835052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,balanced,0.5936479965845743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.01,2.8865983963012694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.01,14.071878051757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.01,3.607660675048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,balanced,0.6718933582305908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,power_law_1.01,0.1174015998840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.01,5.715603256225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,power_law_1.01,0.14354560375213624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,balanced,0.9501866499582926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,power_law_1.01,0.10833280086517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.01,10.45291519165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,power_law_1.01,0.15482239723205565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,balanced,2.3283519744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,balanced,1.1118240356445312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,power_law_1.01,0.17363200187683106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,4,power_law_1.2,0.17598079442977904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,power_law_1.01,0.29074559211730955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,4,power_law_1.2,0.11818239688873292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,power_law_1.01,0.3078783988952637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,4,power_law_1.2,0.14382719993591309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,power_law_1.01,0.3186176061630249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,balanced,1.6087946891784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,4,power_law_1.2,0.23153278827667237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,power_law_1.01,0.32794239521026614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,4,power_law_1.2,0.315775990486145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,power_law_1.01,0.338809609413147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,4,power_law_1.2,0.5157440185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,power_law_1.01,0.36745600700378417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,4,power_law_1.2,0.5494976043701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,balanced,2.116480032602946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,balanced,2.7869653701782227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,power_law_1.01,0.3927488088607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,4,power_law_1.2,0.5708608150482177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,power_law_1.01,0.3965183973312378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,4,power_law_1.2,0.6093247890472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,power_law_1.01,0.41792640686035154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,4,power_law_1.2,0.6124864101409913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,power_law_1.01,0.47509121894836426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,4,power_law_1.2,0.6651264190673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,4,power_law_1.2,0.6723840236663818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,balanced,2.9267091751098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,4,power_law_1.2,0.7195072174072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,power_law_1.01,0.44417920112609866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,4,power_law_1.2,0.6990719795227051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,balanced,12.014906565348307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,4,power_law_1.2,0.6814911842346192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,4,power_law_1.2,0.7426559925079346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,power_law_1.01,0.49298558235168455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,4,power_law_1.2,0.7575424194335938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,4,power_law_1.2,0.886079978942871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,power_law_1.01,0.5105343818664551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,4,power_law_1.2,0.9092288017272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,balanced,3.9530986150105796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,power_law_1.01,0.6137216091156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,4,power_law_1.2,1.0497471809387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,balanced,4.24567985534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,4,power_law_1.2,1.1454208374023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,power_law_1.01,0.7157055854797363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,4,power_law_1.2,1.3829952239990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,power_law_1.01,0.9100735664367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,4,power_law_1.2,1.5164095878601074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,power_law_1.01,1.148748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,power_law_1.01,1.356991958618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,4,power_law_1.2,1.9652864456176757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,power_law_1.01,1.9288896560668944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,4,power_law_1.2,0.10623359680175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,4,power_law_1.2,2.4764736175537108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,power_law_1.01,2.680806350708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,balanced,4.777071952819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,4,power_law_1.2,0.07465599775314331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,4,power_law_1.2,3.943385696411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,4,power_law_1.2,0.09259520173072815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,power_law_1.01,3.8358463287353515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,4,power_law_1.2,0.14790400266647338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,4,power_law_1.2,5.465343856811524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,power_law_1.01,5.5311424255371096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,4,power_law_1.2,0.17920000553131105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,4,power_law_1.2,0.28263039588928224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,4,power_law_1.2,5.832992172241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,power_law_1.01,6.355136108398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,4,power_law_1.2,0.30090880393981934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,4,power_law_1.2,0.3178879976272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,4,power_law_1.2,8.82416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,4,power_law_1.2,0.33133440017700194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,power_law_1.01,10.053107452392577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,4,power_law_1.2,0.3478912115097046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,4,power_law_1.2,0.35818240642547605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,4,power_law_1.2,0.3689152002334595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,4,power_law_1.2,19.521165466308595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,power_law_1.01,20.927449035644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,4,power_law_1.2,0.3554176092147827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,4,power_law_1.2,0.37786240577697755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,4,power_law_1.2,0.3997056007385254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,4,power_law_1.2,0.4024640083312988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,4,power_law_1.2,0.43137922286987307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,4,power_law_1.2,0.5278592109680176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,balanced,7.945525487263997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,4,power_law_1.2,0.5452544212341308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,4,power_law_1.2,0.6516223907470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,4,power_law_1.2,0.6532224178314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,4,power_law_1.2,0.8353856086730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,4,power_law_1.2,1.039072036743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,4,power_law_1.2,1.284601593017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,balanced,8.51753044128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,4,power_law_1.2,1.7627904891967774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,4,power_law_1.2,2.431430435180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,4,power_law_1.2,2.979635238647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,4,power_law_1.2,4.22545280456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,4,power_law_1.2,6.364198303222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,4,power_law_1.2,12.342098999023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,balanced,16.089771270751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,4,power_law_1.2,0.11724799871444702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,4,power_law_1.2,0.07556480169296265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,4,power_law_1.2,0.1029312014579773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,balanced,0.07762666543324788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,4,power_law_1.2,0.13366400003433226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,balanced,0.10409067074457805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,4,power_law_1.2,0.17564799785614013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,4,power_law_1.2,0.2838207960128784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,balanced,0.15970133741696677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,4,power_law_1.2,0.31286399364471434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,balanced,0.29924799998601276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,4,power_law_1.2,0.32210559844970704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,4,power_law_1.2,0.3407167911529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,balanced,0.5437920093536377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,4,power_law_1.2,0.3516671895980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,balanced,0.6829280058542887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,balanced,0.6890400250752767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,4,power_law_1.2,0.37396481037139895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,balanced,0.703167994817098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,4,power_law_1.2,0.394649600982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,balanced,0.7073386510213217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,4,power_law_1.2,0.4149312019348145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,balanced,0.7063306967417399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,4,power_law_1.2,0.44216318130493165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,balanced,0.706501324971517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,4,power_law_1.2,0.4946944236755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,balanced,0.71561066309611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,balanced,0.714629332224528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,balanced,0.06010133524735769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,balanced,0.7239680290222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,4,power_law_1.2,0.4496895790100098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,balanced,0.7353973388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,balanced,0.0740586668252945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,balanced,0.10521066188812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,balanced,0.7430133024851481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,balanced,0.17212265729904175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,4,power_law_1.2,0.5094592094421386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,balanced,0.758629322052002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,balanced,0.3015893300374349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,balanced,0.3599840005238851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,balanced,0.8653546969095866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,4,power_law_1.2,0.5595392227172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,balanced,0.37061333656311035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,balanced,0.8251893520355225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,balanced,0.3681173324584961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,4,power_law_1.2,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,balanced,0.3720426559448242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,balanced,0.8826826413472494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,balanced,0.3754133383433024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,4,power_law_1.2,0.7592895984649658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,balanced,0.3813440004984538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,balanced,0.9853653113047282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,balanced,0.3842560052871704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,4,power_law_1.2,0.9653759956359863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,balanced,0.3866879940032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,4,power_law_1.2,1.2050496101379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,balanced,0.39317866166432697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,4,power_law_1.2,1.579411220550537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,balanced,1.2516907056172688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,balanced,0.40611732006073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,4,power_law_1.2,2.0973440170288087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,balanced,0.4116213321685791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,4,power_law_1.2,2.96060791015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,balanced,1.268346627553304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,balanced,0.4294240077336629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,4,power_law_1.2,4.300774383544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,balanced,0.511301318804423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,4,power_law_1.2,5.470073699951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,balanced,0.49902931849161786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,balanced,2.1890719731648765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,4,power_law_1.2,7.376076507568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,balanced,0.5629013379414877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,4,power_law_1.2,11.033401489257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,balanced,0.6403306722640991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.01,0.11281919479370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,balanced,2.1180319786071777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.01,0.13379199504852296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,balanced,0.8583040237426758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,4,power_law_1.2,24.123948669433595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.01,0.13437440395355224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.01,0.22172799110412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,balanced,0.9323200384775797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.01,0.29594879150390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.01,0.5185344219207764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,balanced,0.0731573353211085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.01,0.5375360012054443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,balanced,0.08238933483759563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.01,0.5547200202941894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,balanced,2.7665332158406577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,balanced,1.3746132850646973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,balanced,0.11178666353225708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.01,0.5796735763549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,balanced,0.19722666343053183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.01,0.5883456230163574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,balanced,0.30085867643356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.01,0.6368000030517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,balanced,0.3677440087000529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.01,0.6300543785095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,balanced,0.37379733721415204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,balanced,0.376911997795105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,balanced,1.6178186734517415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.01,0.6439231872558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,balanced,0.3821973403294881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.01,0.6983488082885743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,balanced,0.3862186670303345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,balanced,0.3930079936981201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.01,0.07807360291481018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.01,0.7322944164276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,balanced,0.4024746815363566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,balanced,3.9094667434692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.01,0.7637184143066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.01,0.09076480269432068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,balanced,0.40879468123118085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,balanced,0.4222079912821452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.01,0.09303680062294006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.01,0.7936448097229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,balanced,0.44069866339365643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,balanced,2.270789305369059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.01,0.13494399785995484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.01,0.9919679641723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.01,0.1699136018753052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.01,0.9148351669311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.01,0.28615679740905764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.01,1.109273624420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,balanced,0.4551413456598918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.01,0.29605119228363036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.01,1.048198413848877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.01,0.321727991104126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.01,1.2645759582519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.01,0.323686408996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.01,1.7657791137695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,balanced,4.364432017008464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.01,0.33402879238128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,balanced,2.95794677734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,power_law_1.01,0.08789119720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.01,2.3603328704833983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.01,0.34214398860931394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,balanced,0.49452801545461017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.01,0.3591232061386108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,power_law_1.01,0.11742719411849975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.01,2.3092159271240233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.01,0.3665152072906494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,power_law_1.01,0.0939136028289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.01,3.661190414428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.01,0.36613121032714846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,power_law_1.01,0.14928640127182008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.01,0.3953855991363525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,power_law_1.01,0.19372160434722902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.01,4.448851013183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.01,0.4003647804260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,power_law_1.01,0.2888319969177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.01,0.43856000900268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.01,5.396294403076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,balanced,0.5773226817448934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,power_law_1.01,0.31832959651947024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.01,0.5158656120300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,power_law_1.01,0.3183487892150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.01,0.5158592224121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,balanced,0.6399733225504557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.01,9.47022705078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,power_law_1.01,0.3425280094146729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.01,0.6208191871643066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,power_law_1.01,0.35319039821624754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,balanced,3.4872639973958335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.01,0.6703296184539795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,power_law_1.01,0.37226879596710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.01,0.8662912368774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.01,13.728224182128907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.01,1.0753536224365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,power_law_1.01,0.39385600090026857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,balanced,0.7875946362813314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.01,1.384870433807373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,power_law_1.01,0.41054720878601075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,2,power_law_1.2,0.11214720010757447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.01,1.7329856872558593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,power_law_1.01,0.45427842140197755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,balanced,0.9247573216756185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,balanced,7.524421056111653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,2,power_law_1.2,0.10339200496673584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,power_law_1.01,0.49129600524902345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.01,2.450592041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,2,power_law_1.2,0.11340800523757935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,balanced,1.3657546043395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.01,3.4341888427734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,2,power_law_1.2,0.1973952054977417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,power_law_1.01,0.4859327793121338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.01,4.151520156860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,2,power_law_1.2,0.2778496026992798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,balanced,1.6428160667419434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.01,6.4477699279785154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,2,power_law_1.2,0.5305280208587646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,power_law_1.01,0.5438720226287842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,2,power_law_1.2,0.5593664169311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.01,11.934060668945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,2,power_law_1.2,0.5670400142669678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,balanced,2.374565283457438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,2,power_law_1.2,0.5866623878479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,power_law_1.01,0.6138239860534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,balanced,5.673952102661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,2,power_law_1.2,0.5951104164123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,power_law_1.01,0.7173632144927978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,2,power_law_1.2,0.6610112190246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,2,power_law_1.2,0.6685184001922607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,balanced,3.1014026006062827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,power_law_1.01,0.8813504219055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,2,power_law_1.2,0.6663616180419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,power_law_1.01,1.0429951667785644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,2,power_law_1.2,0.6963583946228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,power_law_1.01,1.3932095527648927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,2,power_law_1.2,0.7516863822937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,power_law_1.01,1.8157503128051757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,2,power_law_1.2,0.7663167953491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,power_law_1.01,2.6013439178466795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,2,power_law_1.2,0.8505855560302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,balanced,4.37940788269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,2,power_law_1.2,1.0006655693054198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,power_law_1.01,3.372383880615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,2,power_law_1.2,0.9523712158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,2,power_law_1.2,1.1464896202087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,power_law_1.01,5.036435317993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,2,power_law_1.2,1.0483519554138183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,power_law_1.01,6.687961578369141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,2,power_law_1.2,1.3951104164123536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,power_law_1.01,7.743059539794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,2,power_law_1.2,1.89486083984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,balanced,5.913962682088216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,2,power_law_1.2,2.4499711990356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,power_law_1.01,12.767743682861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,2,power_law_1.2,2.7048576354980467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,balanced,13.92749277750651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,2,power_law_1.2,3.8128318786621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,power_law_1.01,25.435501098632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,2,power_law_1.2,5.276038360595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,2,power_law_1.2,5.93950080871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,2,power_law_1.2,9.536268615722657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,balanced,7.10590934753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,balanced,11.034346262613932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,2,power_law_1.2,14.93170623779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,2,power_law_1.2,0.07767040133476258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,2,power_law_1.2,0.06638720035552978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,2,power_law_1.2,0.08624640107154846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,balanced,11.7937380472819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,2,power_law_1.2,0.12602239847183228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,2,power_law_1.2,0.16469119787216185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,2,power_law_1.2,0.28204801082611086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,2,power_law_1.2,0.30312960147857665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,2,power_law_1.2,0.32756481170654295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,2,power_law_1.2,0.3267712116241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,2,power_law_1.2,0.3452159881591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,2,power_law_1.2,0.3650304079055786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,2,power_law_1.2,0.37153921127319334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,2,power_law_1.2,0.37854719161987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,2,power_law_1.2,0.3882175922393799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,2,power_law_1.2,0.4100351810455322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,2,power_law_1.2,0.4262847900390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,2,power_law_1.2,0.45352959632873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,2,power_law_1.2,0.5292928218841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,2,power_law_1.2,0.5381824016571045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,2,power_law_1.2,0.6212351799011231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,2,power_law_1.2,0.7144896030426026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,2,power_law_1.2,0.9128959655761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,2,power_law_1.2,1.1171199798583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,2,power_law_1.2,1.4861568450927733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,2,power_law_1.2,1.9238143920898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,balanced,23.744730631510418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,2,power_law_1.2,2.5642623901367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,2,power_law_1.2,3.766291046142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,2,power_law_1.2,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,2,power_law_1.2,4.257932662963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,2,power_law_1.2,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,2,power_law_1.2,0.09741439819335937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,balanced,0.07967466612656911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,2,power_law_1.2,6.495993804931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,2,power_law_1.2,0.13971840143203734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,balanced,0.10498133301734924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,2,power_law_1.2,0.17921279668807982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,balanced,0.1618666648864746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,2,power_law_1.2,12.831878662109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,2,power_law_1.2,0.28126718997955324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,balanced,0.29942933718363446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,balanced,0.5489333470662435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,2,power_law_1.2,0.31230080127716064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,balanced,0.7005386352539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,2,power_law_1.2,0.3300928115844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,balanced,0.7053759892781576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,2,power_law_1.2,0.3316031932830811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,balanced,0.7125013669331869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,balanced,0.7119626998901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,2,power_law_1.2,0.36520960330963137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,balanced,0.7075200080871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,2,power_law_1.2,0.38179199695587157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,balanced,0.7172586917877197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,balanced,0.7177013556162516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,2,power_law_1.2,0.4070144176483154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,balanced,0.7259253660837809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,2,power_law_1.2,0.4286208152770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,balanced,0.7418560187021891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,2,power_law_1.2,0.47349119186401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,balanced,0.7556373278299967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,balanced,0.7680799961090088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,2,power_law_1.2,0.5135744094848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,balanced,0.7885706424713135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,balanced,0.8896213372548422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,2,power_law_1.2,0.5022272109985352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,balanced,0.8955946763356527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,balanced,1.014906644821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,2,power_law_1.2,0.5589632034301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,balanced,1.1625920136769612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,balanced,0.0595360000928243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,2,power_law_1.2,0.6473087787628173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,balanced,1.4757067362467449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,balanced,0.07946666578451793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,2,power_law_1.2,0.712985610961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,balanced,0.11203199625015259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,balanced,0.18547733624776205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,balanced,1.682144006093343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,balanced,0.31915199756622314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,2,power_law_1.2,0.9000831604003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,balanced,0.3850346803665161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,2,power_law_1.2,1.1131648063659667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,balanced,0.3937386671702067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,balanced,0.39640533924102783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,2,power_law_1.2,1.4527296066284179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,balanced,2.8671305974324546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,balanced,0.4005653460820516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,balanced,0.09679466485977173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,2,power_law_1.2,1.8450559616088866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,balanced,0.4013599952061971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,balanced,0.4108373324076335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,balanced,0.10558399558067322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,2,power_law_1.2,2.6146175384521486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.060198402404785155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.07594879865646362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,balanced,0.42053866386413574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,balanced,0.14468266566594443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,balanced,0.20257065693537393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,balanced,2.9330453872680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.07064319849014282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,2,power_law_1.2,3.3648960113525392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,balanced,0.4250719944636027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.08997120261192322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,balanced,0.33504001299540204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.09499520063400269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,balanced,0.44304001331329346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.1298367977142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,balanced,0.4102986653645833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,2,power_law_1.2,5.104339218139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.1338047981262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,balanced,0.46324801445007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,balanced,0.42022931575775146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.21393280029296874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.18373759984970092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,balanced,0.4731146494547526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,balanced,0.42546133200327557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,2,power_law_1.2,7.053292846679687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.3022144079208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.01,0.28117120265960693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,balanced,0.43303465843200684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,balanced,0.4974506696065267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.5093696117401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.01,0.32179200649261475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,balanced,0.4395039876302083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,balanced,4.999333381652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,2,power_law_1.2,8.393292999267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,balanced,0.6267626682917277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.01,0.3307775974273682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,balanced,0.4522186517715454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.5572288036346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.01,0.3383807897567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,balanced,0.6065813302993774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.5760064125061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,balanced,0.46381866931915283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,2,power_law_1.2,12.832365417480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.01,0.35560319423675535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.58787841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,balanced,0.4787733157475789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,balanced,0.7742613156636556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.01,0.37531518936157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.595961618423462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,balanced,0.5119786659876505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.01,0.39394559860229494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.6432127952575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,balanced,0.8172640005747477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.01,0.41699838638305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,2,power_law_1.2,27.343960571289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.6673984050750732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,balanced,0.5490293502807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.01,0.41651201248168945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.6878655910491943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,balanced,5.590165456136067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.01,0.44250240325927737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,balanced,1.1145226955413818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.746995210647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.01,0.46160640716552737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.7808832168579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.01,0.508351993560791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.8226240158081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,balanced,1.3186399936676025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,balanced,0.5842826763788859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.82806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.01,0.5732096195220947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.9406975746154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,0.6168000221252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.9675647735595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,0.7467072010040283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.01,1.0970879554748536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,balanced,2.011413256327311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,0.8200575828552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.01,1.1758848190307618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,balanced,0.6478933493296305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,1.06245756149292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.01,1.4714176177978515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,1.4470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.01,2.0694847106933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,balanced,6.36619758605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,2.0045440673828123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.01,2.7488895416259767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,balanced,2.470442612965902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.01,3.5483329772949217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,2.4837888717651366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.01,4.772320175170899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,3.6504257202148436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,balanced,0.8121866385142008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.01,5.564761734008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,4.8180992126464846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,balanced,0.9309546947479248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.01,5.9237312316894535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.01,7.2826690673828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,balanced,1.2074133555094402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,balanced,3.8264748255411782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.01,9.015980529785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.01,11.015904235839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,balanced,1.4550612767537434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.01,17.781210327148436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,balanced,2.2140480677286782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.01,21.34649658203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,balanced,2.7290080388387046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,balanced,10.32215436299642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,balanced,4.687808036804199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,power_law_1.01,0.09259520173072815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,power_law_1.01,0.10561920404434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,balanced,4.054815928141276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,power_law_1.01,0.12117120027542114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,power_law_1.01,0.1630336046218872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.0757695972919464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,power_law_1.01,0.19918080568313598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,power_law_1.01,0.31493120193481444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,balanced,5.258581479390462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.11552640199661254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,power_law_1.01,0.352294397354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.19189759492874145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,balanced,5.4190718332926435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,power_law_1.01,0.36895360946655276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.27591040134429934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,power_law_1.01,0.380511999130249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.5010816097259522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,power_law_1.01,0.3983680009841919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.541811180114746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,power_law_1.01,0.42741122245788576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.5659647941589355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,power_law_1.01,0.4480703830718994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,balanced,7.541760126749675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.6215295791625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,power_law_1.01,0.48099842071533205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,power_law_1.01,0.5296127796173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.6163072109222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,power_law_1.01,0.5903039932250976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.662227201461792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.6520768165588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,power_law_1.01,0.6112512111663818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.705836820602417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,balanced,9.987701416015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.7598976135253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,power_law_1.01,0.6934847831726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,balanced,8.794928232828775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.7940480232238769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.8252096176147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.8651264190673829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,power_law_1.01,0.8166591644287109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,balanced,19.945850372314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.9672767639160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.01,0.9673664093017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.9895359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.01,1.2343551635742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,1,power_law_1.2,1.1310400009155273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.01,1.5122624397277833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,1,power_law_1.2,1.205561637878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.01,2.0917247772216796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,balanced,12.2150510152181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,1,power_law_1.2,1.5501055717468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.01,2.6779712677001952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,1,power_law_1.2,2.108492851257324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.01,3.8399871826171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,1,power_law_1.2,2.834752082824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.01,5.009215927124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,1,power_law_1.2,3.6654720306396484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.01,7.319084930419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,1,power_law_1.2,4.89024658203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.01,9.636454772949218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,1,power_law_1.2,6.009273529052734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.01,12.027078247070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,1,power_law_1.2,7.621849822998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,power_law_1.01,19.014764404296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,1,power_law_1.2,10.9302978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,balanced,19.57347234090169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,1,power_law_1.2,21.353721618652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,power_law_1.01,37.861856079101564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,balanced,17.56814956665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.05772160291671753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.09414399862289428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.12679040431976318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.17221120595932007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,1,power_law_1.2,0.2763967990875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,1,power_law_1.2,0.31303040981292723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,1,power_law_1.2,0.32598400115966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,1,power_law_1.2,0.3532991886138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,1,power_law_1.2,0.369049596786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,1,power_law_1.2,0.39341440200805666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,1,power_law_1.2,0.4023104190826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,1,power_law_1.2,0.42558717727661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,1,power_law_1.2,0.4237696170806885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,1,power_law_1.2,0.45747199058532717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,1,power_law_1.2,0.47976322174072267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,1,power_law_1.2,0.5197504043579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,1,power_law_1.2,0.5847487926483155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,0.6300735950469971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,0.769158411026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,balanced,39.90343475341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,0.84202880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,balanced,0.0813920001188914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,1.103660774230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,balanced,0.10149866342544556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,1.4851648330688476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,balanced,0.1518933375676473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,1,power_law_1.2,0.09351040124893188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,2.0441728591918946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,balanced,0.27192533016204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,1,power_law_1.2,0.10003199577331542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,2.5593727111816404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,1,power_law_1.2,0.1170240044593811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,balanced,0.4970826705296834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,1,power_law_1.2,0.15411839485168458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,balanced,0.9503680070241293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,1,power_law_1.2,0.19367680549621583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,3.8035839080810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,1,power_law_1.2,0.31510400772094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,1,power_law_1.2,0.3446912050247192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,5.0038398742675785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,balanced,1.4067145983378093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,1,power_law_1.2,0.37411839962005616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,1,power_law_1.2,0.3981055974960327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,balanced,1.404304027557373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,1,power_law_1.2,6.075059127807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,1,power_law_1.2,0.4127039909362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,1,power_law_1.2,0.44350080490112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,balanced,1.401312033335368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,1,power_law_1.2,0.4603775978088379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,1,power_law_1.2,9.070738983154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,balanced,1.4034612973531086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,1,power_law_1.2,0.4900928020477295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,1,power_law_1.2,0.5446335792541503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,balanced,1.404213269551595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,1,power_law_1.2,0.6021312236785888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,1,power_law_1.2,17.764268493652345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,balanced,1.4143625895182292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,balanced,1.4166879653930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,1,power_law_1.2,0.614246416091919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,balanced,1.3996213277180989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,balanced,1.414255936940511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,1,power_law_1.2,0.697817611694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,balanced,1.4184692700703938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,1,power_law_1.2,0.8285632133483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,balanced,1.4273600578308105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.2,0.971673583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.2,1.2455679893493652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,balanced,1.448186715443929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.2,1.5155967712402343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.2,2.0957183837890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,balanced,1.5063680013020833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.2,2.6882560729980467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,balanced,1.5458614031473796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.2,3.8564414978027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,balanced,0.07266666491826375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.2,5.006784057617187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,balanced,0.09989866614341736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,balanced,1.5833333333333333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,balanced,0.1612160007158915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.2,7.3411201477050785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,balanced,0.27620800336201984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,balanced,0.504800001780192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.2,9.646291351318359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,balanced,0.7420000235239664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,balanced,1.6432852745056152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,balanced,0.72980268796285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.2,11.93496322631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,balanced,0.7306826909383138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,balanced,0.7347040176391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,balanced,1.755568027496338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,balanced,0.7374453544616699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,1,power_law_1.2,18.93653106689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,balanced,0.7386933167775472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,balanced,0.7469493548075358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,balanced,0.7504106362660726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,balanced,1.8538932800292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,balanced,0.7617493470509847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,1,power_law_1.2,37.586630249023436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,balanced,0.7652053038279215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,balanced,0.7794026533762614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,balanced,0.8061172962188721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,balanced,2.0682026545206704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,balanced,0.8262560367584229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,balanced,0.8655573527018229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,balanced,0.9002559979756674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,balanced,2.313231945037842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,balanced,0.9687413374582926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,balanced,0.0647680014371872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.01,0.2737600088119507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,balanced,1.047887961069743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.1778496026992798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,balanced,0.07449600100517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.01,0.5048255920410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,balanced,0.11204800009727478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.01,0.2671488046646118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.01,0.9435327529907227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,balanced,0.1811359922091166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,balanced,1.1871039867401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.01,0.4962751865386963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,balanced,0.2996906638145447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,balanced,3.1000693639119468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.01,0.2628671884536743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,balanced,0.49489601453145343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.01,0.1592960000038147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.01,0.4358719825744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,balanced,0.7156053384145101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.01,0.22121601104736327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.01,0.6736256122589112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,balanced,0.7176106770833334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,balanced,1.3871679306030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.01,0.37010560035705564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,balanced,0.720192035039266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.01,0.7276671886444092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.01,0.4028480052947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,balanced,0.7234079837799072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.01,1.039468765258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,balanced,0.72597336769104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.01,0.4832320213317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,balanced,0.7314613660176595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.01,1.0559231758117675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.01,0.5410751819610595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,balanced,0.7355573177337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.01,0.5514560222625733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,balanced,1.6676586469014485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.01,1.1038463592529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,balanced,0.7423253059387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,balanced,4.030032157897949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,balanced,0.756981372833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.01,0.5834047794342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.01,1.0083840370178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,balanced,0.7612640062967936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.01,0.6008959770202636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.01,1.1106687545776368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,balanced,0.7789866924285889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.01,0.5971839904785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.01,1.0924223899841308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,balanced,0.808730681737264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.01,0.601529598236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.01,1.199392032623291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.01,0.6909696102142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,balanced,2.131648063659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.01,1.2337663650512696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.01,0.6975935935974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.01,1.2318528175354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.01,0.7161920070648193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.01,0.7440959930419921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.01,1.3250240325927733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,balanced,0.835477352142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,0.8227968215942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.01,1.4726079940795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,0.9613504409790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.01,1.774662399291992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,0.9538559913635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,power_law_1.01,0.17072639465332032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.01,2.019833564758301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,1.213926410675049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.01,1.9248319625854493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,balanced,5.491472244262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,balanced,2.7284587224324546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,1.221440029144287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,power_law_1.01,0.2805887937545776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.01,2.425017547607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,balanced,0.9058506488800049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,1.5226880073547364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,power_law_1.01,0.5020287990570068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.01,2.022208023071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,1.8942144393920899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,power_law_1.01,0.1510975956916809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,balanced,0.971834659576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.01,2.4951103210449217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,2.3301311492919923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,power_law_1.01,0.24917120933532716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.01,2.999910354614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,2.7419712066650392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,balanced,1.0825706322987874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,power_law_1.01,0.350931191444397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,8,power_law_1.2,0.29149439334869387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.01,3.7638145446777345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.01,3.378643035888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,8,power_law_1.2,0.4884672164916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,power_law_1.01,0.41701760292053225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,balanced,1.2069653669993083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.01,4.508652877807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.01,5.193983840942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,8,power_law_1.2,0.4290112018585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,power_law_1.01,0.4668288230895996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.01,5.609228897094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,8,power_law_1.2,0.24559359550476073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,power_law_1.01,0.5035520076751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.01,10.159852600097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,balanced,1.431968053181966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,8,power_law_1.2,0.4368127822875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,balanced,3.9387146631876626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.01,8.376268768310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,power_law_1.01,0.5415743827819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,8,power_law_1.2,0.54202880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,8,power_law_1.2,0.7136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,power_law_1.01,0.5696959972381592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.01,15.217587280273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,8,power_law_1.2,0.9044544219970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,balanced,1.9485333760579426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,power_law_1.01,0.5815423965454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,8,power_law_1.2,0.9781696319580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,power_law_1.01,0.6216896057128907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,8,power_law_1.2,0.9475584030151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,power_law_1.01,0.690393590927124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,8,power_law_1.2,1.0678208351135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,power_law_1.01,0.7338880062103271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,balanced,2.38808536529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,8,power_law_1.2,1.1004672050476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,power_law_1.01,0.7504384040832519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,8,power_law_1.2,1.152128028869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,power_law_1.01,0.8205696105957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,8,power_law_1.2,1.1630463600158691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,balanced,10.963877360026041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,power_law_1.01,0.9594816207885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,8,power_law_1.2,1.1187071800231934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,8,power_law_1.2,1.1795455932617187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.01,0.8939071655273437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,8,power_law_1.2,1.276038360595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,balanced,3.2705227533976235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,8,power_law_1.2,1.4338239669799804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,8,power_law_1.2,1.7031360626220704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.01,0.9629887580871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,8,power_law_1.2,2.1807424545288088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.01,1.127353572845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,8,power_law_1.2,1.9567167282104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.01,1.367155170440674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.1573248028755188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,8,power_law_1.2,2.6716287612915037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.01,1.4616512298583983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,8,power_law_1.2,2.3414400100708006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,8,power_law_1.2,0.26702721118927003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.01,1.9684415817260743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,8,power_law_1.2,0.26295039653778074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,balanced,7.556575775146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,balanced,4.29694398244222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,8,power_law_1.2,2.694163131713867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,8,power_law_1.2,0.1599679946899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.01,2.433363151550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,8,power_law_1.2,3.09881591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,8,power_law_1.2,0.23992960453033446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.01,3.4583934783935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,8,power_law_1.2,0.3288831949234009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,8,power_law_1.2,3.892038345336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,8,power_law_1.2,0.35423998832702636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,8,power_law_1.2,5.210655975341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.01,5.070259094238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,8,power_law_1.2,0.48480639457702634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,8,power_law_1.2,0.5062272071838378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,8,power_law_1.2,7.078790283203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,power_law_1.01,6.179193496704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,8,power_law_1.2,0.5271743774414063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,8,power_law_1.2,0.5614783763885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,8,power_law_1.2,8.859385681152343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,power_law_1.01,9.54922866821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,8,power_law_1.2,0.5912191867828369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,8,power_law_1.2,0.624512004852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,8,power_law_1.2,17.058905029296874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,8,power_law_1.2,0.6286719799041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,power_law_1.01,18.5603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,8,power_law_1.2,0.6708543777465821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,balanced,6.705434799194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,8,power_law_1.2,0.7217343807220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,8,power_law_1.2,0.7004928112030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,8,power_law_1.2,0.7997888088226318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,0.8717951774597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,1.0205504417419433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,1.0357888221740723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,1.2235520362854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,1.3713536262512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,1.5900287628173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,2.008064079284668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,2.4746559143066404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,3.3591487884521483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,8,power_law_1.2,4.47891845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,8,power_law_1.2,6.981702423095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,8,power_law_1.2,13.174642944335938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,balanced,13.41979726155599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,8,power_law_1.2,0.19001599550247192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,8,power_law_1.2,0.28095359802246095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,8,power_law_1.2,0.2130687952041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,8,power_law_1.2,0.15437439680099488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,8,power_law_1.2,0.2458751916885376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,8,power_law_1.2,0.30969600677490233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,balanced,0.07590400179227193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,8,power_law_1.2,0.37036159038543703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,balanced,0.10071999828020732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,balanced,0.15435733397801718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,8,power_law_1.2,0.495692777633667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,balanced,0.2783946593602498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,8,power_law_1.2,0.5015935897827148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,balanced,0.5073279937108358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,8,power_law_1.2,0.5512447834014893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,balanced,0.9827573299407959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,balanced,0.0584799995024999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,8,power_law_1.2,0.5224063873291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,balanced,1.4625439643859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,balanced,0.07377066711584727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,balanced,1.451327959696452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,8,power_law_1.2,0.6082687854766846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,balanced,0.10175466537475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,balanced,0.16159466902414957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,balanced,1.4597172737121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,8,power_law_1.2,0.590937614440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,balanced,0.27715200185775757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,balanced,1.4571946461995442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,balanced,0.503605326016744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,8,power_law_1.2,0.6400767803192139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,balanced,0.7379360198974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,balanced,1.4638932545979817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,8,power_law_1.2,0.6758399963378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,balanced,0.7391040325164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,balanced,1.4691200256347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,8,power_law_1.2,0.7154751777648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,balanced,0.7373706499735514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,balanced,1.472933292388916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,balanced,0.7428960005442301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,8,power_law_1.2,0.8117376327514648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,balanced,0.7477599779764811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,balanced,1.4453919728597004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,8,power_law_1.2,0.9865728378295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,balanced,0.7516640027364095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,balanced,1.4623252550760906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,balanced,0.7582399845123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,balanced,1.4696906407674153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,balanced,0.7629600365956625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.2,1.061023998260498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,balanced,0.7821599642435709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,balanced,1.483674685160319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,balanced,0.7817920049031576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,balanced,1.5213546752929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,balanced,0.8031253019968668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,balanced,1.5903894106547039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.2,1.056172752380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,balanced,0.8283147017161051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.2,1.2501248359680175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,balanced,0.8491946856180826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,balanced,1.6430452664693196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.2,1.6247615814208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,balanced,0.8977386951446533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,balanced,1.6666186650594075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.2,1.624563217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,balanced,0.9508533477783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.2,2.2113344192504885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,balanced,1.7585973739624023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.2,3.000294494628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,balanced,1.0509440104166667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.2,4.127865600585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,balanced,1.8956000010172527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.01,0.1739967942237854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,balanced,0.07489066819349925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,balanced,1.1592960357666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.01,0.10896639823913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.2,5.425164794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.01,0.26512000560760496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,balanced,0.08539199829101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.01,0.1560320019721985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,8,power_law_1.2,6.383340835571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.01,0.4914239883422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,balanced,0.11873066425323486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.01,0.27117440700531004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,balanced,2.0897706349690757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,balanced,0.187882661819458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,balanced,1.3534612655639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.01,0.22206079959869385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.01,0.14736640453338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,balanced,0.3078400095303853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,8,power_law_1.2,9.437728118896484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,balanced,0.5030346711476644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.01,0.4167424201965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.01,0.23432319164276122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,balanced,0.7256693045298258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.01,0.6118847846984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.01,0.32614400386810305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,balanced,0.7276159922281901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,balanced,2.2734667460123696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,balanced,1.6014026006062825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,8,power_law_1.2,23.146502685546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.01,0.7340799808502197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,balanced,0.7328159809112549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.01,0.3876800060272217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,balanced,0.737119992574056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.01,0.8863871574401856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.01,0.48067197799682615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,balanced,0.7419359683990479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.01,0.9910847663879394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.01,0.5158656120300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,balanced,0.7488106886545817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.01,0.5158656120300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.01,0.9949119567871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,balanced,0.7555359999338785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,balanced,0.7666133244832357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.01,0.557689619064331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,balanced,2.000394662221273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.01,1.0607808113098145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,balanced,2.6274986267089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,balanced,0.7826293309529623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.01,0.5816768169403076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.01,1.1309184074401855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,balanced,0.7930026849110922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.01,0.6008959770202636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.01,1.059455966949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,balanced,0.8119413057963053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.01,0.625926399230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.01,1.133471965789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.01,0.6769472122192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,balanced,0.8596159617106119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.01,1.205452823638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.01,0.7041215896606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.01,1.1831232070922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,balanced,2.5744959513346353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,balanced,3.3643147150675454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.01,0.6944255828857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.01,1.2385727882385253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.01,0.7648575782775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.01,1.3805695533752442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,balanced,0.9119253158569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.01,0.7972544193267822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.01,1.5541440010070802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,power_law_1.01,0.12192000150680542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.01,0.953337574005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.01,1.843449592590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,power_law_1.01,0.17937920093536378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.01,0.9699007987976074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.01,1.781657600402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,power_law_1.01,0.29035520553588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.01,1.1729023933410645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.01,2.177190399169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,power_law_1.01,0.15910400152206422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,4,power_law_1.2,0.17392640113830565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.01,1.177011203765869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,balanced,3.1841812133789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.01,2.029779243469238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,power_law_1.01,0.22933120727539064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,4,power_law_1.2,0.2653248071670532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.01,1.4736255645751952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,balanced,4.66979185740153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,power_law_1.01,0.34346880912780764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.01,2.45611515045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,4,power_law_1.2,0.2714240074157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,balanced,1.018293301264445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.01,1.8053760528564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,power_law_1.01,0.38855040073394775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,4,power_law_1.2,0.21676158905029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.01,2.7966079711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,balanced,1.1100746790568035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,power_law_1.01,0.48343682289123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,4,power_law_1.2,0.3865407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.01,2.487436866760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.01,3.5784767150878904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,4,power_law_1.2,0.5061183929443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,power_law_1.01,0.5138432025909424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.01,3.123660850524902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,balanced,1.2800959746042888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,4,power_law_1.2,0.5968512058258056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.01,4.384595108032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,power_law_1.01,0.5199872016906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,4,power_law_1.2,0.8282879829406739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,power_law_1.01,0.5577151775360107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.01,5.293689727783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.01,3.7081985473632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,4,power_law_1.2,0.912076759338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,power_law_1.01,0.5831168174743653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,balanced,1.4937012990315754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.01,7.402188873291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,4,power_law_1.2,0.9529919624328613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.01,5.558591842651367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,power_law_1.01,0.6246848106384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,power_law_1.01,0.6591231822967529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,4,power_law_1.2,1.0315135955810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,power_law_1.01,0.6939839839935302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.01,10.975692749023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,4,power_law_1.2,1.0608511924743653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,balanced,1.841002623240153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.01,17.057522583007813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,power_law_1.01,0.7322815895080567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,4,power_law_1.2,1.0731200218200683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,balanced,4.717893282572429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,power_law_1.01,0.7856768131256103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,4,power_law_1.2,1.1106240272521972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,balanced,6.248224258422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,power_law_1.01,0.9477760314941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,4,power_law_1.2,1.160159969329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,balanced,2.5571254094441733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,4,power_law_1.2,1.1989439964294433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,4,power_law_1.2,1.2678336143493651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,power_law_1.01,0.9591679573059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,4,power_law_1.2,1.3690688133239746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,4,power_law_1.2,1.5641471862792968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,power_law_1.01,1.0286656379699708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,4,power_law_1.2,1.8065343856811524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,4,power_law_1.2,1.902284812927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,power_law_1.01,1.1951871871948243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,balanced,3.322869300842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,power_law_1.01,1.549574375152588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,4,power_law_1.2,2.442732810974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,power_law_1.01,1.744767951965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,4,power_law_1.2,2.1689216613769533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,power_law_1.01,2.3159231185913085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,4,power_law_1.2,2.754560089111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,power_law_1.01,2.90067195892334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,4,power_law_1.2,3.0356927871704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,power_law_1.01,4.194662475585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,4,power_law_1.2,3.7480640411376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,balanced,4.4557491938273115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,power_law_1.01,5.255936050415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,4,power_law_1.2,4.851987075805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,power_law_1.01,6.7147773742675785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,4,power_law_1.2,6.680531311035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,4,power_law_1.2,8.917356872558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,power_law_1.01,10.225772857666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,power_law_1.2,19.577536010742186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,power_law_1.01,20.778790283203126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,balanced,5.778106689453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,balanced,9.201621373494467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,4,balanced,12.398452758789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,4,power_law_1.2,0.10919040441513062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,balanced,9.021450678507486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,4,power_law_1.2,0.155840003490448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,4,power_law_1.2,0.13983360528945923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,4,power_law_1.2,0.13434239625930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,4,power_law_1.2,0.22234880924224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,4,power_law_1.2,0.29668478965759276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,4,power_law_1.2,0.32496640682220457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,4,power_law_1.2,0.4646143913269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,4,power_law_1.2,0.483519983291626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,4,power_law_1.2,0.5322624206542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,4,power_law_1.2,0.5306240081787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,4,power_law_1.2,0.5688576221466064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,4,power_law_1.2,0.5897088050842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,4,power_law_1.2,0.6279808044433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,4,power_law_1.2,0.6656320095062256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,4,power_law_1.2,0.6955840110778808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,4,power_law_1.2,0.6807040214538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,4,power_law_1.2,0.7833600044250488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,4,power_law_1.2,0.8087167739868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,4,power_law_1.2,1.0114687919616698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,balanced,18.040693918863933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,4,power_law_1.2,1.0002495765686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,4,power_law_1.2,1.214361572265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,4,power_law_1.2,1.279097557067871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,4,power_law_1.2,1.6830463409423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,4,power_law_1.2,2.004416084289551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,balanced,0.07925333579381307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,4,power_law_1.2,2.6204351425170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,balanced,0.10127466917037964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,4,power_law_1.2,3.4338047027587892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,balanced,0.1548906664053599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,4,power_law_1.2,0.13007359504699706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,balanced,0.27188267310460407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,4,power_law_1.2,3.8537216186523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,balanced,0.5052853425343832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,4,power_law_1.2,0.17971199750900269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,balanced,0.9545866648356119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,4,power_law_1.2,6.4212158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,4,power_law_1.2,0.19199999570846557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,balanced,1.4161866505940754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,4,power_law_1.2,0.15374079942703248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,balanced,1.4297280311584473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,4,power_law_1.2,12.68081283569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,4,power_law_1.2,0.22230401039123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,balanced,1.4275306065877278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,4,power_law_1.2,0.30589439868927004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,balanced,1.4412533442179363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,4,power_law_1.2,0.3523904085159302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,balanced,1.4568853378295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,balanced,1.4559253056844075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,4,power_law_1.2,0.4695615768432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,balanced,1.4707040786743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,4,power_law_1.2,0.5063488006591796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,balanced,1.4654080073038738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,4,power_law_1.2,0.5213503837585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,balanced,1.4757013320922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,4,power_law_1.2,0.5548927783966064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,balanced,1.4860159556070964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,4,power_law_1.2,0.5796800136566163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,balanced,1.5011520385742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,4,power_law_1.2,0.6101568222045899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,balanced,1.5306240717569988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,4,power_law_1.2,0.6560959815979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,balanced,1.5900160471598308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,4,power_law_1.2,0.7046463966369629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,4,power_law_1.2,0.7417535781860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,balanced,1.6582239468892415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,4,power_law_1.2,0.8354432106018066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,balanced,1.7675894101460774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,4,power_law_1.2,0.9697792053222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,balanced,1.9430079460144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,4,power_law_1.2,1.0127167701721191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,balanced,2.072453339894613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,4,power_law_1.2,1.111961555480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,4,power_law_1.2,1.2287808418273927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,4,power_law_1.2,1.654649543762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,balanced,2.387669404347738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,balanced,0.06122133135795593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,balanced,0.07392533123493195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,4,power_law_1.2,1.8980415344238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.01,0.07693439722061157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.01,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,balanced,0.10223467151323955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,4,power_law_1.2,2.4213695526123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.01,0.10160640478134156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,balanced,0.16325333714485168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.01,0.15520000457763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.01,0.15394560098648072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,balanced,0.28389867146809894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,balanced,2.73857053120931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,4,power_law_1.2,3.106847953796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.01,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,balanced,0.5208106835683187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.01,0.12469760179519654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,balanced,0.7469013532002767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,4,power_law_1.2,4.657279968261719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.01,0.20867838859558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.01,0.2190016031265259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,balanced,0.7500267028808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.01,0.31756160259246824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.01,0.3780735969543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,4,power_law_1.2,5.578163146972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,balanced,0.7559519608815511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,balanced,0.1053013304869334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.01,0.3791680097579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,balanced,0.7660106817881266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.01,0.5843071937561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,balanced,0.11174399654070537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,4,power_law_1.2,7.385062408447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,balanced,0.768122673034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.01,0.47104640007019044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,balanced,3.4121440251668296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.01,0.6985343933105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,balanced,0.13991999626159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,balanced,0.7733973662058512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.01,0.5019711971282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,balanced,0.7802666823069254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,balanced,0.18864534298578897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.01,0.9008255958557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,4,power_law_1.2,11.517337799072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,balanced,0.7845919926961263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.01,0.5222335815429687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,balanced,0.32501333951950073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.01,0.9476032257080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,balanced,0.7957866986592611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,balanced,0.5333546797434489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.01,0.5730368137359619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,balanced,0.802069346110026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,balanced,0.768293301264445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.01,0.965004825592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.01,0.5764351844787597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,balanced,0.823029359181722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,4,power_law_1.2,25.142445373535157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,balanced,0.7739573319753011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.01,1.0476415634155274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,balanced,0.864565372467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.01,0.5913472175598145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,balanced,0.7809973557790121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.01,1.105196762084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,balanced,0.898026704788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,balanced,0.7839413483937582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.01,0.6488383769989013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,balanced,4.217909177144368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,balanced,0.7947999636332194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.01,1.1266495704650878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.01,0.6812672138214111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,balanced,0.9825973510742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,balanced,0.8062293529510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.01,1.154041576385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.01,0.7154367923736572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,balanced,1.0661386648813884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,balanced,0.8166666825612386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.01,1.1895999908447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.01,0.6969088077545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,balanced,0.8311733404795328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.01,1.242527961730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.01,0.7965312004089355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,balanced,1.2171093622843425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.01,1.2515775680541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,balanced,0.8516106605529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.01,0.8354880332946777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.01,1.3845248222351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,balanced,0.8688053290049235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.01,0.985478401184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.01,1.458137607574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,balanced,1.3618079821268718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,balanced,0.9184906482696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.01,1.0470656394958495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.01,1.6334911346435548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,balanced,5.608021418253581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,balanced,1.0084959665934246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.01,1.866988754272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.01,1.317427158355713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.01,2.107052803039551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,balanced,1.6656427383422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.01,1.4288960456848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.01,2.0877695083618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.01,1.7668352127075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.01,2.423481559753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.01,2.1318080902099608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,balanced,1.0934666792551677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.01,3.0497919082641602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.01,2.9009599685668945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,balanced,2.0611039797465005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.01,3.840403366088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.01,3.6834686279296873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.01,5.161734390258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.01,4.5771839141845705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,power_law_1.01,0.11918720006942748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.01,6.593778991699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.01,6.967123413085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,power_law_1.01,0.14468480348587037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,balanced,1.2903786500295003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,balanced,2.7621119817097983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.01,8.504447937011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,power_law_1.01,0.20403199195861815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.01,14.122317504882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,balanced,1.4535573323567708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,power_law_1.01,0.1623103976249695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,balanced,7.67410151163737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,power_law_1.01,0.24718079566955567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.01,18.323033142089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,power_law_1.01,0.34106879234313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,balanced,1.7426026662190754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,power_law_1.01,0.399782395362854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,power_law_1.01,0.5056575775146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,balanced,2.101312001546224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,balanced,3.5181118647257485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,power_law_1.01,0.5473599910736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,power_law_1.01,0.5845119953155518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,2,power_law_1.2,0.10812159776687622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,power_law_1.01,0.6059072017669678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,2,power_law_1.2,0.1552575945854187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,balanced,2.721914609273275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,power_law_1.01,0.6277696132659912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,2,power_law_1.2,0.18072320222854615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,power_law_1.01,0.6441984176635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,2,power_law_1.2,0.21897599697113038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,power_law_1.01,0.6909056186676026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,2,power_law_1.2,0.34330239295959475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,2,power_law_1.2,0.45934081077575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,power_law_1.01,0.7398464202880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,balanced,3.7136799494425454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,power_law_1.01,0.7932479858398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,2,power_law_1.2,0.5985472202301025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,balanced,4.401983896891276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,power_law_1.01,0.8708224296569824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,2,power_law_1.2,0.8902848243713379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,power_law_1.01,1.0501440048217774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,2,power_law_1.2,0.8958784103393554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,2,power_law_1.2,0.9489855766296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,power_law_1.01,1.0863615989685058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,2,power_law_1.2,1.0087103843688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,balanced,4.902810732523601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,2,power_law_1.2,1.0720831871032714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,2,power_law_1.2,1.0612095832824706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,power_law_1.01,1.2842368125915526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,2,power_law_1.2,1.1392191886901855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,power_law_1.01,1.4738304138183593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,2,power_law_1.2,1.1879424095153808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,power_law_1.01,1.9581184387207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,2,power_law_1.2,1.2255488395690919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,2,power_law_1.2,1.2399935722351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,power_law_1.01,2.2106815338134767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,2,power_law_1.2,1.4186880111694335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,balanced,6.651173273722331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,balanced,14.636975606282553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,power_law_1.01,3.0559616088867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,balanced,6.745850880940755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,2,power_law_1.2,1.4803647994995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,power_law_1.01,3.755807876586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,2,power_law_1.2,1.6902847290039062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,power_law_1.01,5.502361679077149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,2,power_law_1.2,1.8912063598632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,power_law_1.01,6.921017456054687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,2,power_law_1.2,2.3765823364257814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,power_law_1.01,8.970745849609376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,2,power_law_1.2,2.2707712173461916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,2,power_law_1.2,2.660051155090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,power_law_1.01,13.901612854003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,balanced,8.38209088643392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,2,power_law_1.2,3.2278785705566406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,2,power_law_1.2,4.25786247253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,power_law_1.01,27.848992919921876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,2,power_law_1.2,5.403404617309571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,2,power_law_1.2,6.578797149658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,2,power_law_1.2,9.499641418457031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,2,power_law_1.2,18.804524230957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,balanced,13.05233637491862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,2,power_law_1.2,0.0774399995803833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,balanced,13.291695912679037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,2,power_law_1.2,0.10184320211410522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,2,power_law_1.2,0.11252479553222657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,2,power_law_1.2,0.1283455967903137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,2,power_law_1.2,0.20970239639282226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,2,power_law_1.2,0.2896384000778198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,2,power_law_1.2,0.33596799373626707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,2,power_law_1.2,0.4516608238220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,2,power_law_1.2,0.4908927917480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,2,power_law_1.2,0.516864013671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,2,power_law_1.2,0.5501567840576171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,2,power_law_1.2,0.5647359848022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,2,power_law_1.2,0.5867392063140869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,2,power_law_1.2,0.6558464050292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,2,power_law_1.2,0.686188793182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,2,power_law_1.2,0.7323584079742431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,2,power_law_1.2,0.7265408039093018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,2,power_law_1.2,0.8405119895935058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,2,power_law_1.2,0.8917119979858399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,2,power_law_1.2,1.026591968536377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,2,power_law_1.2,1.1368639945983887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,balanced,0.07774400214354198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,balanced,25.370150248209637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,2,power_law_1.2,0.11425280570983887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,2,power_law_1.2,1.3697855949401856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,balanced,0.10249066352844238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,2,power_law_1.2,0.1445312023162842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,2,power_law_1.2,1.4813568115234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,balanced,0.15713066856066385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,balanced,0.27491732438405353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,2,power_law_1.2,0.16080000400543212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,2,power_law_1.2,1.8243135452270507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,balanced,0.5153599977493286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,2,power_law_1.2,0.15893759727478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,balanced,0.9681706428527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,2,power_law_1.2,2.215750312805176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,balanced,1.4259680112202961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,2,power_law_1.2,0.22665600776672362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,balanced,1.4403947194417317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,2,power_law_1.2,3.083628845214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,balanced,1.44048007329305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,2,power_law_1.2,0.2962368011474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,balanced,1.4622079531351726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,2,power_law_1.2,3.8600833892822264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,2,power_law_1.2,0.35516159534454345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,balanced,1.4712319374084473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,balanced,1.464431921641032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,2,power_law_1.2,4.71965446472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,2,power_law_1.2,0.5038911819458007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,balanced,1.4870559374491374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,2,power_law_1.2,0.5201856136322022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,balanced,1.494501272837321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,2,power_law_1.2,7.115257263183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,2,power_law_1.2,0.5522560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,balanced,1.5020747184753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,2,power_law_1.2,0.5822912216186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,balanced,1.4999626477559407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,2,power_law_1.2,14.263827514648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,2,power_law_1.2,0.6324607849121093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,balanced,1.5182773272196453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,2,power_law_1.2,0.6446847915649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,balanced,1.5860586166381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,2,power_law_1.2,0.6946239948272706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,balanced,1.6828746795654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,2,power_law_1.2,0.7676928043365479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,balanced,1.8139893213907878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,2,power_law_1.2,0.8132672309875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,balanced,1.9985225995381672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,2,power_law_1.2,0.8892736434936523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,balanced,2.271567980448405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,2,power_law_1.2,1.0964608192443848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,balanced,2.5348000526428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,2,power_law_1.2,1.1284031867980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,balanced,0.06573866804440816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,balanced,3.084335962931315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,2,power_law_1.2,1.328985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,balanced,0.08022400240103404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,balanced,0.10838933785756429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,2,power_law_1.2,1.545356845855713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,balanced,0.17378133535385132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,balanced,0.2966559926668803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,2,power_law_1.2,2.010028839111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,balanced,0.5411359866460165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,balanced,3.7684478759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,2,power_law_1.2,2.3725568771362306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,balanced,0.7817280292510986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,balanced,0.7881813049316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,2,power_law_1.2,3.204972839355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,balanced,0.8004960219065348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,balanced,0.8034826914469401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,2,power_law_1.2,4.115353775024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,balanced,0.812058687210083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,2,power_law_1.2,5.767219161987304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,balanced,0.8287999629974365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,balanced,5.168197313944499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,balanced,0.8412480354309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,2,power_law_1.2,7.870912170410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,balanced,0.8640213012695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,balanced,0.8874399662017822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,balanced,0.1662399967511495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,2,power_law_1.2,8.858118438720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,balanced,0.9195040067036947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,balanced,0.17340266704559326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.07797759771347046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,balanced,0.9471360047658285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,balanced,0.19709867238998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,2,power_law_1.2,15.036000061035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.1004032015800476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,balanced,1.0117759704589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,balanced,0.26131200790405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.15764479637145995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,balanced,0.36815468470255536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,balanced,1.0581440130869548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.19752960205078124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,balanced,6.061562856038411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,balanced,0.6156746546427408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.37770240306854247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,balanced,0.8791306813557943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,2,power_law_1.2,28.100741577148437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,balanced,1.1854453086853027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,balanced,0.8888426621754965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.6015488147735596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,balanced,0.8977866967519125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.674783992767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,balanced,1.3088640371958415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.06169599890708923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,balanced,0.9034026463826498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.9003007888793946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,balanced,0.9207946459452311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.9141183853149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.07594879865646362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,balanced,1.5121386845906575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.9942079544067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,balanced,0.9388533433278402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.10543999671936036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.01,1.0287872314453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,balanced,0.9565386772155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.13269120454788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.01,1.0797823905944823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,balanced,1.8136906623840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,balanced,0.9886879920959473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.01,1.1216832160949708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.2215872049331665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,balanced,7.291952133178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,balanced,1.0305546919504802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.01,1.159724807739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.01,0.33471360206604006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.01,1.1975040435791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,balanced,1.065381368001302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.01,0.39473919868469237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,balanced,2.386202653249105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.01,1.2431743621826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,balanced,1.1370666821797688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.01,0.49452800750732423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.01,1.2909055709838868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,balanced,1.2887252966562908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.01,0.5300159931182862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.01,1.4317567825317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.01,0.5516799926757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.01,1.533478355407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,balanced,2.977562586466471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.01,0.5922368049621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.01,1.7761728286743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.01,0.6213312149047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.01,2.007967948913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,balanced,1.4371573130289714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.01,2.3849536895751955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.01,0.6511040210723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.01,0.682809591293335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.01,2.6036096572875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.01,0.7363391876220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.01,3.3030975341796873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.01,0.7782400131225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,balanced,4.237514813741048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.01,4.275795364379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.01,0.8037055969238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.01,5.971763229370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,balanced,10.848052978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.01,0.9114944458007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,balanced,1.865594704945882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.01,6.090496063232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,1.0102335929870605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,balanced,2.1821279525756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,1.2272319793701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.01,7.416268920898437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,1.284620761871338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.01,11.092537689208985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,1.5792256355285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,balanced,2.628767967224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,1.7894464492797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,balanced,4.917605400085449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,2.295814323425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.01,23.931398010253908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,balanced,3.408320109049479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,3.083123207092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,4.312038421630859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,4.948774337768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,balanced,4.440117200215657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,power_law_1.01,0.1477952003479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.01,5.995532989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,power_law_1.01,0.16288000345230103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,power_law_1.01,0.1984063982963562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.01,9.285453033447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,balanced,6.081872304280599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,power_law_1.01,0.21311359405517577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,balanced,6.465311686197917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,power_law_1.01,0.3023616075515747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,power_law_1.01,0.3963007926940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.01,20.432960510253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,power_law_1.01,0.47712001800537107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,power_law_1.01,0.5909887790679932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,power_law_1.01,0.6261312007904053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,balanced,8.601898829142252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,power_law_1.01,0.6546175956726075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,power_law_1.01,0.7018239974975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.10069119930267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.1292736053466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,power_law_1.01,0.72740478515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.1966912031173706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,power_law_1.01,0.7635583877563477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.34551680088043213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.4820864200592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,power_law_1.01,0.8681856155395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,balanced,23.67681121826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,balanced,9.250602722167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.5998271942138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,power_law_1.01,0.96878080368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,balanced,11.773979187011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.8481087684631348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,power_law_1.01,0.9989376068115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.9214271545410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,power_law_1.01,1.1547072410583497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,power_law_1.01,1.4307519912719726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.9492351531982421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,1,power_law_1.2,1.0146495819091796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,1,power_law_1.2,1.0894463539123536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.01,1.569164752960205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,1,power_law_1.2,1.1378944396972657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,1,power_law_1.2,1.1752320289611817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.01,1.8130752563476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,1,power_law_1.2,1.194707202911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.01,2.1618816375732424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,balanced,14.665531158447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,1,power_law_1.2,1.2440447807312012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.01,2.886636734008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,1,power_law_1.2,1.3064448356628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.01,3.540140914916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,1,power_law_1.2,1.454099178314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,1,power_law_1.2,1.589971160888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.01,4.878464126586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,1,power_law_1.2,1.8611648559570313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.01,6.221395111083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,1,power_law_1.2,2.055404853820801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,1,power_law_1.2,2.434809684753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.01,8.800953674316407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,1,power_law_1.2,2.712819290161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.01,11.584928131103515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,1,power_law_1.2,3.362278366088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,1,power_law_1.2,4.532601547241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.01,14.145074462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.06183680295944214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,1,power_law_1.2,6.172915267944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.07616639733314515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,1,power_law_1.2,6.31146240234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.08857600092887878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,power_law_1.01,22.165190124511717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,balanced,22.708880106608074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.13196799755096436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,1,power_law_1.2,7.543328094482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.19534720182418824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,balanced,20.01099141438802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,1,power_law_1.2,11.196422576904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,1,power_law_1.2,0.28504960536956786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,power_law_1.01,43.2353271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,1,power_law_1.2,0.34454400539398194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,1,power_law_1.2,23.899781799316408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,1,power_law_1.2,0.49390082359313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,1,power_law_1.2,0.5103487968444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,1,power_law_1.2,0.5351808071136475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,1,power_law_1.2,0.5749055862426757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,1,power_law_1.2,0.610752010345459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,1,power_law_1.2,0.6494400024414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,1,power_law_1.2,0.6986688137054443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,1,power_law_1.2,0.7335360050201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,1,power_law_1.2,0.768671989440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,1,power_law_1.2,0.8268608093261719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,1,power_law_1.2,0.9232640266418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,1.0347007751464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,1.2512191772460937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,1.336569595336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,1.6156351089477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,1.8521663665771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,balanced,0.05823466678460439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,2.3932863235473634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,balanced,44.7296142578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,balanced,0.06307200094064076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,3.2666366577148436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,balanced,0.06937066713968913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,balanced,0.07546666761239369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,4.5170433044433596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,balanced,0.08850133419036865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,5.0177665710449215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,balanced,0.12566933035850525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,1,power_law_1.2,0.1440384030342102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,balanced,0.1276639997959137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,1,power_law_1.2,0.16056959629058837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,1,power_law_1.2,6.075878524780274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,balanced,0.12753066420555115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,1,power_law_1.2,0.18908159732818602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,balanced,0.12461333473523457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,1,power_law_1.2,9.389190673828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,1,power_law_1.2,0.21850240230560303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,balanced,0.1263040006160736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,1,power_law_1.2,0.27555840015411376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,balanced,0.12585066755612692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,1,power_law_1.2,0.3542335987091064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,1,power_law_1.2,20.13173065185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,balanced,0.16942399740219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,1,power_law_1.2,0.42024960517883303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,1,power_law_1.2,0.5509952068328857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,balanced,0.16825600465138754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,power_law_1.01,0.10331519842147827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,1,power_law_1.2,0.5933248043060303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,balanced,0.1673706571261088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,power_law_1.01,0.13264000415802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,1,power_law_1.2,0.6160895824432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,balanced,0.2969546715418498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,power_law_1.01,0.09550719857215881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,1,power_law_1.2,0.6668543815612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,balanced,0.29546133677164715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,power_law_1.01,0.07429760098457336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,1,power_law_1.2,0.7188672065734864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,balanced,0.29517332712809247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,power_law_1.01,0.08543360233306885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,1,power_law_1.2,0.7488831996917724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,power_law_1.01,0.09784319996833801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,balanced,0.29444799820582074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,1,power_law_1.2,0.8368320465087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,power_law_1.01,0.11006079912185669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,1,power_law_1.2,0.9139583587646485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,balanced,0.2982826630274455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,power_law_1.01,0.118777596950531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,1,power_law_1.2,0.9844160079956055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,balanced,0.30158400535583496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,power_law_1.01,0.11414400339126587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,1,power_law_1.2,1.1371264457702637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,balanced,0.312336007754008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,power_law_1.01,0.11904640197753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,1,power_law_1.2,1.4003264427185058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,power_law_1.01,0.12092159986495972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,balanced,0.3356586694717407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,power_law_1.01,0.16874879598617554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,power_law_1.01,0.15879039764404296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.2,1.5286272048950196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,balanced,0.3600533405939738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,power_law_1.01,0.16839040517807008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,power_law_1.01,0.30046079158782957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.2,1.8339008331298827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,balanced,0.6344159841537476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,power_law_1.01,0.2918528079986572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.2,2.184454345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,power_law_1.01,0.2801471948623657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.2,2.9151424407958983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,power_law_1.01,0.30636160373687743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,balanced,0.6807200113932291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,power_law_1.01,0.355347204208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.2,3.5065471649169924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,power_law_1.01,0.3904128074645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.2,4.871212768554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,power_law_1.01,0.45288958549499514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,power_law_1.01,0.539731216430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.2,6.172057723999023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,balanced,0.9992907047271729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,power_law_1.01,0.7102464199066162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.2,8.84988784790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,power_law_1.01,0.9703359603881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.2,11.450374603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,power_law_1.01,1.1161279678344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,balanced,1.3242080211639404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,power_law_1.01,1.6292863845825196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.2,14.116166687011718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,power_law_1.01,2.506284713745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,balanced,0.04888000090916952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,8,power_law_1.2,0.10313600301742554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,1,power_law_1.2,22.055416870117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,power_law_1.01,2.6618112564086913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,power_law_1.01,0.0732479989528656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,balanced,0.053957333167394005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,8,power_law_1.2,0.11910400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,power_law_1.01,3.9050113677978517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,balanced,0.05702400207519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,power_law_1.01,0.09198079705238342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,balanced,1.6404587427775066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,8,power_law_1.2,0.08393599987030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,balanced,0.07411733269691467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,power_law_1.01,0.06791679859161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,8,power_law_1.2,0.08095359802246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,power_law_1.01,8.810336303710937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,balanced,0.08546666304270427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,power_law_1.01,0.07416319847106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,8,power_law_1.2,0.08390399813652039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,1,power_law_1.2,43.340826416015624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,balanced,0.12407466769218445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,power_law_1.01,0.07971839904785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,balanced,0.12544000148773193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,8,power_law_1.2,0.09031040072441102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,balanced,0.12592533230781555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,power_law_1.01,0.08433279991149903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,8,power_law_1.2,0.1206976056098938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,balanced,0.12598400314648947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,power_law_1.01,0.10493439435958862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,8,power_law_1.2,0.11759359836578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,balanced,0.12681066989898682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,power_law_1.01,0.10927360057830811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,balanced,0.12878933548927307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,8,power_law_1.2,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,balanced,2.5941173235575357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,balanced,0.12930666406949362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,power_law_1.01,0.11246720552444459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,8,power_law_1.2,0.11461759805679321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,balanced,0.12967999776204428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,power_law_1.01,0.12065919637680053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,balanced,0.1302773356437683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,8,power_law_1.2,0.12142080068588257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,power_law_1.01,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,balanced,0.1657866636912028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,8,power_law_1.2,0.16605440378189087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,power_law_1.01,0.11879040002822876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,balanced,0.16395200292269388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,8,power_law_1.2,0.16880639791488647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,power_law_1.01,0.12410880327224731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,balanced,0.1653279960155487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,8,power_law_1.2,0.17248640060424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,power_law_1.01,0.12695679664611817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,balanced,0.31434667110443115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,8,power_law_1.2,0.31086719036102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,power_law_1.01,0.16581759452819825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,balanced,0.31758399804433185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,power_law_1.01,0.1691200017929077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,8,power_law_1.2,0.3167680025100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,power_law_1.01,0.18747520446777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,8,power_law_1.2,0.32943999767303467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,balanced,0.3216853340466817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,power_law_1.01,0.3155263900756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,8,power_law_1.2,0.36353919506072996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,power_law_1.01,0.3591552019119263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,balanced,0.3306186596552531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,8,power_law_1.2,0.38508799076080324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,4,power_law_1.2,0.07203840017318726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,8,power_law_1.2,0.43065600395202636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,power_law_1.01,0.40529279708862304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,balanced,0.351962685585022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,4,power_law_1.2,0.08598399758338929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,8,power_law_1.2,0.5269567966461182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,power_law_1.01,0.4477695941925049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,8,power_law_1.2,0.6188864231109619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,4,power_law_1.2,0.0702015995979309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,balanced,5.147295951843262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,balanced,0.3744693199793498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,power_law_1.01,0.5306047916412353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,8,power_law_1.2,0.8249216079711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,4,power_law_1.2,0.07528960108757018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,power_law_1.01,0.6951104164123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,8,power_law_1.2,1.1076607704162598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,4,power_law_1.2,0.08218880295753479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,balanced,0.6664586861928304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,8,power_law_1.2,1.3684608459472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,power_law_1.01,0.7980671882629394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,4,power_law_1.2,0.08464000225067139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,8,power_law_1.2,2.049260711669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,power_law_1.01,1.0719488143920899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,4,power_law_1.2,0.09681919813156128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,8,power_law_1.2,2.866841506958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,balanced,0.7109173138936361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,power_law_1.01,1.4535679817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,4,power_law_1.2,0.108787202835083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,8,power_law_1.2,3.143116760253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,4,power_law_1.2,0.11338880062103271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,power_law_1.01,2.0016191482543944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,8,power_law_1.2,5.2563518524169925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,4,power_law_1.2,0.11422079801559448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,balanced,1.0484800338745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,power_law_1.01,2.486534309387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,4,power_law_1.2,0.11705600023269654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,8,power_law_1.2,10.709343719482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,balanced,0.03516799956560135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,power_law_1.01,3.571718215942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,4,power_law_1.2,0.11696640253067017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,balanced,0.03991466760635376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,4,power_law_1.2,0.12474240064620971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,power_law_1.01,7.394579315185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,balanced,0.04444266855716705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,balanced,1.386122703552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,4,power_law_1.2,0.1278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,balanced,0.06898666421572368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,4,power_law_1.2,0.17466239929199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,4,power_law_1.2,0.18680959939956665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,balanced,0.08785067001978557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,4,power_law_1.2,0.19701119661331176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,balanced,0.12453866998354594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,balanced,1.7280373573303223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,4,power_law_1.2,0.3529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,balanced,0.12587733070055643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,4,power_law_1.2,0.38207359313964845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,balanced,0.1262986660003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,balanced,0.1260586678981781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,4,power_law_1.2,0.4280831813812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,balanced,0.12638399998346964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,4,power_law_1.2,0.5063936233520507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,balanced,0.12734400232632956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,4,power_law_1.2,0.5828159809112549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,balanced,0.12769066294034323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,4,power_law_1.2,0.7096447944641113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,balanced,2.731306711832682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,balanced,0.13134933511416116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,4,power_law_1.2,0.9858048439025879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,balanced,0.13343999783198038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,4,power_law_1.2,1.2255295753479003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,balanced,0.134853333234787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,4,power_law_1.2,1.768819236755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,balanced,0.1370560030142466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,4,power_law_1.2,2.3048255920410154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,balanced,0.13886933525403342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,4,power_law_1.2,2.716671943664551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,balanced,0.17466133832931519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,balanced,0.18010133504867554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,4,power_law_1.2,3.5993152618408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,balanced,0.3417653242746989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,power_law_1.2,8.239564514160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,balanced,0.352234681447347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,balanced,0.3749973376592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,4,balanced,5.372149149576823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,balanced,0.4002186854680379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,balanced,0.7075146834055582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,balanced,0.7541653315226237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,balanced,1.1070240338643391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,power_law_1.01,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,2,power_law_1.2,0.03562879860401154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,power_law_1.01,0.043263998627662656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,power_law_1.01,0.044172799587249754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,2,power_law_1.2,0.04259200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,power_law_1.01,0.06410880088806152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,2,power_law_1.2,0.045721599459648134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,balanced,1.4590773582458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,power_law_1.01,0.07033600211143494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,2,power_law_1.2,0.06151679754257202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,power_law_1.01,0.08332160115242004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,2,power_law_1.2,0.0686016023159027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,power_law_1.01,0.09938560128211975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,2,power_law_1.2,0.08001919984817504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,power_law_1.01,0.10670720338821411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,2,power_law_1.2,0.09621760249137878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,power_law_1.01,0.106278395652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,balanced,1.81059726079305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,2,power_law_1.2,0.09588479995727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,power_law_1.01,0.11498240232467652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,power_law_1.01,0.12046719789505005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,2,power_law_1.2,0.10679039955139161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,2,power_law_1.2,0.1147007942199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,power_law_1.01,0.11733759641647339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,power_law_1.01,0.11640959978103638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,2,power_law_1.2,0.11528960466384888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,power_law_1.01,0.13059840202331544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,2,power_law_1.2,0.11957119703292847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,power_law_1.01,0.13435519933700563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,2,power_law_1.2,0.12295680046081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,power_law_1.01,0.14361599683761597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,2,power_law_1.2,0.13441280126571656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,balanced,2.877786636352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,power_law_1.01,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,2,power_law_1.2,0.13576960563659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,power_law_1.01,0.20965759754180907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,2,power_law_1.2,0.1464192032814026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,power_law_1.01,0.22332160472869872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,2,power_law_1.2,0.16008960008621215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,power_law_1.01,0.40491518974304197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,power_law_1.01,0.433241605758667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,2,power_law_1.2,0.21653759479522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,power_law_1.01,0.5207359790802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,2,power_law_1.2,0.23164799213409423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,balanced,0.028207999964555103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,power_law_1.01,0.6300992012023926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,2,power_law_1.2,0.43224320411682127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,power_law_1.01,0.8246527671813965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,balanced,0.03309866786003113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,2,power_law_1.2,0.47144317626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,power_law_1.01,1.0167872428894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,balanced,0.038693333665529885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,2,power_law_1.2,0.554911994934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,power_law_1.01,1.3833024024963378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,2,power_law_1.2,0.6964608192443847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,power_law_1.01,1.8251712799072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,power_law_1.01,2.278886413574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,2,power_law_1.2,0.8806271553039551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,balanced,0.08559999863306682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,balanced,0.12550933162371317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,2,power_law_1.2,1.1075967788696288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,power_law_1.01,3.284147262573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,balanced,0.12502933541933695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,2,power_law_1.2,1.3970815658569335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,balanced,5.694480260213216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,power_law_1.01,6.81628189086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,balanced,0.1251359979311625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,power_law_1.01,0.03244799971580505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,2,power_law_1.2,1.9087295532226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,balanced,0.1262506643931071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,1,power_law_1.2,0.02784000039100647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,balanced,0.12574399511019388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,power_law_1.01,0.03675520122051239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,2,power_law_1.2,2.478086471557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,1,power_law_1.2,0.03206399977207184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,balanced,0.1276533305644989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,power_law_1.01,0.05199360251426697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,1,power_law_1.2,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,2,power_law_1.2,3.40079345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,balanced,0.12788266936937967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,1,power_law_1.2,0.05063040256500244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,power_law_1.01,0.06877440214157104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,balanced,0.13099199533462524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,1,power_law_1.2,0.06133120059967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,power_law_1.01,0.07913600206375122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,2,power_law_1.2,6.989746856689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,balanced,0.13541866342226663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,1,power_law_1.2,0.07372159957885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,power_law_1.01,0.09170560240745544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,balanced,0.13614933689435324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,1,power_law_1.2,0.09339519739151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,power_law_1.01,0.0988864004611969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,1,power_law_1.2,0.09852799773216248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,balanced,0.13845866918563843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,power_law_1.01,0.1071936011314392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,1,power_law_1.2,0.10668799877166749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,balanced,0.14267733693122864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,power_law_1.2,0.10667519569396973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,1,power_law_1.01,0.10911999940872193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,balanced,0.1516693333784739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,power_law_1.2,0.11204479932785034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,1,power_law_1.01,0.11503360271453858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,power_law_1.2,0.11471359729766846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,balanced,0.1584106683731079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,1,power_law_1.01,0.11350400447845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,power_law_1.2,0.11458560228347778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,balanced,0.2070186734199524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,1,power_law_1.01,0.11849600076675415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,power_law_1.2,0.1281216025352478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,power_law_1.2,0.1346560001373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,1,power_law_1.01,0.12054400444030762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,balanced,0.22395733992258707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,power_law_1.2,0.15113600492477416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,power_law_1.2,0.17003519535064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,1,power_law_1.01,0.1330623984336853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,balanced,0.4180266857147217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,power_law_1.2,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,1,power_law_1.01,0.14617600440979003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,power_law_1.2,0.21445760726928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,balanced,0.4489813248316447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,1,power_law_1.01,0.1686911940574646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,power_law_1.2,0.2831295967102051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,1,power_law_1.01,0.18355200290679932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,power_law_1.2,0.325708794593811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,balanced,0.7847786744435629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,1,power_law_1.01,0.21086719036102294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,power_law_1.2,0.5935872077941895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,power_law_1.2,0.6829951763153076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,1,power_law_1.01,0.27414400577545167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,balanced,0.8388000329335531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,power_law_1.2,0.8778688430786132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,1,power_law_1.01,0.3079551935195923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,power_law_1.2,1.0730879783630372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,1,power_law_1.01,0.5731776237487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,power_law_1.2,1.4461119651794434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,1,power_law_1.01,0.6594624042510986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,balanced,1.2247200012207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,power_law_1.2,1.840403175354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,1,power_law_1.01,0.8644607543945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,power_law_1.2,2.2243967056274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,1,power_law_1.01,1.0352319717407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,balanced,0.05796800057093302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,power_law_1.2,3.3583297729492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,power_law_1.01,0.08218880295753479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,1,power_law_1.01,1.431603240966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,power_law_1.2,6.42577896118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,balanced,1.611087958017985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,1,power_law_1.01,1.7945215225219726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,balanced,0.058933332562446594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,power_law_1.01,0.07486079931259156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,power_law_1.01,2.2065408706665037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,power_law_1.01,3.331635284423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,balanced,0.062368000547091164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,power_law_1.01,0.08330879807472229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,1,balanced,1.9971359570821126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,power_law_1.01,6.445747375488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,balanced,0.060319999853769936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,power_law_1.01,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,balanced,0.07273600002129872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,power_law_1.01,0.07123839855194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,1,balanced,3.1547892888387046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,balanced,0.0783786674340566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,power_law_1.01,0.07769600152969361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,power_law_1.01,0.08065919876098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,balanced,0.079434668024381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,power_law_1.01,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,power_law_1.01,0.11945600509643554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,balanced,0.07941333452860515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,power_law_1.01,0.11729919910430908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,balanced,0.11379200220108032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,power_law_1.01,0.11719039678573609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,balanced,0.11345066626866658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,power_law_1.01,0.12215679883956909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,balanced,0.11395200093587239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,power_law_1.01,0.12017920017242431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,power_law_1.01,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,balanced,0.1130560040473938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,1,balanced,6.237301508585612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,power_law_1.01,0.11464320421218872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,balanced,0.1130400002002716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,power_law_1.01,0.14538880586624145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,balanced,0.1139359970887502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,power_law_1.01,0.18261760473251343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,balanced,0.11369599898656209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,power_law_1.01,0.19586559534072875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,power_law_1.01,0.24012160301208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,balanced,0.11557333668073018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,power_law_1.01,0.30965120792388917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,balanced,0.11645866433779399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,8,power_law_1.2,0.07979519963264466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,power_law_1.01,0.3744127988815308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,balanced,0.1195093293984731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,8,power_law_1.2,0.06172159910202026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,power_law_1.01,0.6494080066680908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,power_law_1.01,0.8051456451416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,8,power_law_1.2,0.07465599775314331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,balanced,0.1222879985968272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,power_law_1.01,1.2324416160583496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,balanced,0.046480000019073486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,8,power_law_1.2,0.06218240261077881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,balanced,0.19163199265797934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,power_law_1.01,1.4042688369750977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,8,power_law_1.2,0.0711359977722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,power_law_1.01,1.9538047790527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,balanced,0.2021119991938273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,balanced,0.05199466645717621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,8,power_law_1.2,0.07850880026817322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,power_law_1.01,3.093267250061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,balanced,0.29494933287302655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,power_law_1.01,4.350054550170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,8,power_law_1.2,0.08305280208587647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,balanced,0.05805333455403646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,power_law_1.01,0.06385279893875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,8,power_law_1.2,0.08323839902877808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,power_law_1.01,6.080940628051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,balanced,0.34907201925913495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,balanced,0.06631466746330261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,8,power_law_1.2,0.12069120407104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,power_law_1.01,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,balanced,0.05841066439946493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,power_law_1.01,13.311436462402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,power_law_1.01,0.0645695984363556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,8,power_law_1.2,0.11969280242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,balanced,0.5201333363850912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,balanced,0.058677335580190025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,8,power_law_1.2,0.12128000259399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,power_law_1.01,0.06753280162811279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,balanced,0.06262933214505513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,8,power_law_1.2,0.11959680318832397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,power_law_1.01,0.05686399936676025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,balanced,0.06281066437562306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,8,power_law_1.2,0.11610879898071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,balanced,0.06984533369541168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,power_law_1.01,0.057126402854919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,balanced,0.6689653396606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,balanced,0.0699839989344279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,8,power_law_1.2,0.12046719789505005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,power_law_1.01,0.06417279839515685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,balanced,0.07045333087444305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,8,power_law_1.2,0.1637760043144226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,power_law_1.01,0.06382719874382019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,balanced,0.11801066994667053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,8,power_law_1.2,0.17701120376586915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,power_law_1.01,0.07542399764060974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,balanced,0.11812800168991089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,balanced,0.9882986545562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,8,power_law_1.2,0.18492799997329712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,power_law_1.01,0.07657600045204163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,balanced,0.11860799789428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,8,power_law_1.2,0.2078336000442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,power_law_1.01,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,balanced,0.11859200398127238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,8,power_law_1.2,0.2773632049560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,power_law_1.01,0.1217919945716858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,balanced,0.12044266859690349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,8,power_law_1.2,0.38382720947265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,power_law_1.01,0.12294399738311768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,balanced,0.12109333276748657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,balanced,1.3074346383412678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,8,power_law_1.2,0.5357759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,balanced,0.12525332967440286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,power_law_1.01,0.12346240282058715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,8,power_law_1.2,0.7246335983276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,power_law_1.01,0.1289791941642761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,balanced,0.12788800398508707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,8,power_law_1.2,1.0999615669250489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,power_law_1.01,0.13738880157470704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,balanced,0.18263999621073404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,8,power_law_1.2,1.4617600440979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,power_law_1.01,0.14880640506744386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,balanced,0.19357866048812866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,8,power_law_1.2,2.236345672607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,balanced,1.6225813229878743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,power_law_1.01,0.17891199588775636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,8,power_law_1.2,2.8241855621337892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,balanced,0.291594664255778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,power_law_1.01,0.1948415994644165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,power_law_1.01,0.27395200729370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,8,power_law_1.2,4.4624897003173825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,balanced,0.3636106650034587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,power_law_1.01,0.344268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,8,power_law_1.2,6.368857574462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,power_law_1.01,0.4555327892303467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,balanced,0.5331039826075236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,power_law_1.01,0.5973440170288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,power_law_1.2,8.890016174316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,power_law_1.01,0.9069631576538086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,8,balanced,2.581397374471029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,balanced,0.7009867032368978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,power_law_1.01,1.3215871810913087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,power_law_1.2,18.735136413574217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,4,power_law_1.2,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,power_law_1.01,1.6311616897583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,balanced,0.034234667817751564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,4,power_law_1.2,0.06666240096092224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,power_law_1.01,2.058220863342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,balanced,0.039877332746982574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,4,power_law_1.2,0.07260159850120544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,balanced,1.0357759793599446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,power_law_1.01,2.8542207717895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,4,power_law_1.2,0.0692736029624939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,balanced,0.042730664213498436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,power_law_1.01,4.186124801635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,4,power_law_1.2,0.05666559934616089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,balanced,0.06578133503595988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,4,power_law_1.2,0.059443199634552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,power_law_1.01,7.762028503417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,balanced,0.06047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,4,power_law_1.2,0.0646399974822998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,balanced,1.371455987294515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,balanced,0.05880000193913778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,4,power_law_1.2,0.06443520188331604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,balanced,0.0590826670328776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,balanced,0.06002666552861532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,4,power_law_1.2,0.07439360022544861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,balanced,0.06089599927266439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,4,power_law_1.2,0.07247999906539918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,balanced,0.0611413319905599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,4,power_law_1.2,0.07405440211296081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,balanced,0.06182933350404104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,8,balanced,5.15995724995931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,balanced,0.07308800021807353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,4,power_law_1.2,0.1221119999885559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,balanced,1.7045653661092122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,balanced,0.07246933380762736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,4,power_law_1.2,0.12247040271759033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,balanced,0.07302933434645335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,balanced,0.11360533038775127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,4,power_law_1.2,0.12613760232925414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,balanced,0.11592533191045125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,4,power_law_1.2,0.1316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,balanced,0.11646399895350139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,4,power_law_1.2,0.1437376022338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,balanced,0.12080533305803935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,balanced,0.12482133507728577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,4,power_law_1.2,0.1600640058517456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,balanced,0.19346133867899576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,4,power_law_1.2,0.18247679471969605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,power_law_1.01,0.03460479974746704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,balanced,0.20500266551971436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,4,power_law_1.2,0.2131903886795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,balanced,2.7196213404337564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,balanced,0.3049866755803426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,power_law_1.01,0.040057599544525146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,4,power_law_1.2,0.2610879898071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,power_law_1.01,0.0417279988527298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,balanced,0.3878186543782552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,4,power_law_1.2,0.40782718658447265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,power_law_1.01,0.05516800284385681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,4,power_law_1.2,0.47957119941711424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,balanced,0.5666186809539795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,power_law_1.01,0.058924800157546996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,4,power_law_1.2,0.7118207931518554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,power_law_1.01,0.058220797777175905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,4,power_law_1.2,0.9712512016296386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,power_law_1.01,0.06347519755363465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,balanced,0.7433119614919027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,4,power_law_1.2,1.265497589111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,power_law_1.01,0.06599680185317994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,power_law_1.01,0.07044479846954346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,4,power_law_1.2,2.268070411682129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,power_law_1.01,0.07402880191802978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,balanced,1.0945119857788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,4,power_law_1.2,2.9930496215820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,power_law_1.01,0.07479680180549622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,4,power_law_1.2,3.306252670288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,power_law_1.01,0.07596160173416137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,4,power_law_1.2,5.402259063720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,power_law_1.01,0.07684479951858521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,2,power_law_1.2,0.034195199608802795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,balanced,5.3342132568359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,balanced,1.4355786641438801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,power_law_1.01,0.08057600259780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,2,power_law_1.2,0.04082559943199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,4,power_law_1.2,10.384620666503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,power_law_1.01,0.13299200534820557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,2,power_law_1.2,0.043398401141166686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,power_law_1.01,0.1355839967727661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,2,power_law_1.2,0.05111039876937866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,2,power_law_1.2,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,power_law_1.01,0.13967360258102418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,2,power_law_1.2,0.05802879929542541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,power_law_1.01,0.17047040462493895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,balanced,1.7841599782307942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,2,power_law_1.2,0.06147199869155884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,power_law_1.01,0.19445120096206664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,2,power_law_1.2,0.06639360189437866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,power_law_1.01,0.238700795173645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,2,power_law_1.2,0.0686464011669159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,2,power_law_1.2,0.07394559979438782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,power_law_1.01,0.29762558937072753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,2,power_law_1.2,0.07484800219535828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,power_law_1.01,0.4356991767883301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,2,power_law_1.2,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,2,power_law_1.2,0.07693439722061157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,power_law_1.01,0.5016575813293457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,2,power_law_1.2,0.08542720079421998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,power_law_1.01,0.6948287963867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,balanced,2.8436158498128257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,2,power_law_1.2,0.13388799428939818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,2,power_law_1.2,0.13722239732742308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,power_law_1.01,0.9109760284423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,2,power_law_1.2,0.1486400008201599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,power_law_1.01,1.3975616455078126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,2,power_law_1.2,0.17229440212249755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,2,power_law_1.2,0.19331200122833253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,power_law_1.01,1.8484159469604493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,2,power_law_1.2,0.261900806427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,power_law_1.01,2.2960384368896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,2,power_law_1.2,0.3050559997558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,2,power_law_1.2,0.41665282249450686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,power_law_1.01,3.45863037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,2,power_law_1.2,0.5560192108154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,2,power_law_1.2,0.7310783863067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,power_law_1.01,7.103526306152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,2,power_law_1.2,0.9931455612182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,2,power_law_1.2,1.3888959884643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,2,power_law_1.2,1.7395263671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,2,power_law_1.2,2.5857471466064452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,2,power_law_1.2,3.910905456542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,balanced,5.641658782958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,2,power_law_1.2,7.1595458984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,balanced,0.027850667635599773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,balanced,0.031717332700888314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,balanced,0.03722133239110311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,balanced,0.05795200169086456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,balanced,0.05959466596444448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,power_law_1.01,0.02714880108833313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,balanced,0.054986665646235146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,power_law_1.01,0.030220800638198854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,power_law_1.01,0.03445119857788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,balanced,0.05420266588528951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,balanced,0.05458133419354757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,power_law_1.01,0.04197759926319122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,balanced,0.05485333502292633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,power_law_1.01,0.056652802228927615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,balanced,0.05508266886075338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,balanced,0.05507733424504598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,power_law_1.01,0.05377280116081238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,balanced,0.058821335434913635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,power_law_1.01,0.05403519868850708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,balanced,0.0588266650835673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,1,power_law_1.2,0.027327999472618103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,power_law_1.01,0.05447040200233459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,balanced,0.0605973352988561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,balanced,0.07043200234572093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,power_law_1.01,0.05862399935722351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,1,power_law_1.2,0.030316799879074097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,balanced,0.07172266642252605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,power_law_1.01,0.06353279948234558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,balanced,0.07456533114115398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,1,power_law_1.2,0.033907198905944826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,balanced,0.12733866771062216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,power_law_1.01,0.06898559927940369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,1,power_law_1.2,0.04209280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,balanced,0.13265599807103476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,power_law_1.01,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,1,power_law_1.2,0.05720319747924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,balanced,0.212501327196757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,power_law_1.01,0.07207040190696716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,1,power_law_1.2,0.05470719933509827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,balanced,0.22627200682957968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,power_law_1.01,0.07512959837913513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,1,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,balanced,0.3392159938812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,power_law_1.01,0.07822080254554749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,1,power_law_1.2,0.05614719986915588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,power_law_1.01,0.0950655996799469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,balanced,0.432528018951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,1,power_law_1.2,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,power_law_1.01,0.10049279928207397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,1,power_law_1.2,0.0645695984363556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,power_law_1.01,0.170687997341156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,balanced,0.6323839823404948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,1,power_law_1.2,0.06664320230484008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,power_law_1.01,0.1847615957260132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,1,power_law_1.2,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,power_law_1.01,0.2421567916870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,1,power_law_1.2,0.07258880138397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,balanced,0.8281226952870687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,balanced,0.06286933521429698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,balanced,0.08492799599965413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,power_law_1.01,0.27853438854217527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,1,power_law_1.2,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,balanced,0.08591467142105103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,power_law_1.01,0.3863679885864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,1,power_law_1.2,0.0802623987197876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,balanced,0.06324266890684764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,balanced,0.08546666304270427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,balanced,0.06233599781990051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,balanced,1.2152533531188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,1,power_law_1.2,0.09133440256118774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,power_law_1.01,0.4772480010986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,balanced,0.08624000350634257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,balanced,0.06507733464241028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,1,power_law_1.2,0.1009600043296814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,power_law_1.01,0.6787392139434815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,balanced,0.08717333277066548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,balanced,0.06488533318042755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,1,power_law_1.2,0.17363200187683106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,power_law_1.01,0.8705280303955079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,balanced,0.0867680013179779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,balanced,0.06553066770235698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,1,power_law_1.2,0.18844159841537475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,balanced,0.08649067083994548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,power_law_1.01,1.259552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,balanced,0.06631466746330261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,balanced,1.6053919792175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,1,power_law_1.2,0.2413696050643921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,balanced,0.08738666772842407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,balanced,0.06692266464233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,power_law_1.01,1.6525823593139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,1,power_law_1.2,0.27757439613342283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,balanced,0.09211732943852742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,balanced,0.06825600067774455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,power_law_1.01,2.0307584762573243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,balanced,0.09278933207194011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,balanced,0.06843199829260509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,1,power_law_1.2,0.38976640701293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,balanced,0.08906132976214091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,power_law_1.01,3.1769088745117187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,balanced,0.06822933256626129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,1,power_law_1.2,0.480947208404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,balanced,0.06781866649786632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,balanced,0.09153599540392558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,balanced,1.9932746887207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,1,power_law_1.2,0.6764287948608398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,power_law_1.01,6.242937469482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,balanced,0.06841599941253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,balanced,0.09143466750780742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,1,power_law_1.2,0.8669568061828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,balanced,0.07252266506354015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,balanced,0.10266133149464925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,balanced,0.07728533446788788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,1,power_law_1.2,1.2476863861083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,balanced,0.10311466455459595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,balanced,0.0793333351612091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,1,power_law_1.2,1.634048080444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,balanced,0.10505066315333049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,balanced,0.07945600152015686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,1,power_law_1.2,2.031532859802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,balanced,0.09340799848238628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,balanced,0.11570133765538533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,balanced,0.09842666983604431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,power_law_1.2,3.160767936706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,1,balanced,3.1676108042399087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,balanced,0.11742933591206868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,balanced,0.13537066181500754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,balanced,0.1295253336429596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,power_law_1.2,6.254463958740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,balanced,0.13525866468747458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,balanced,0.2053013245264689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,balanced,0.19338667392730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,balanced,0.17364267508188883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,balanced,0.22669333219528198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,balanced,0.3354346752166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,balanced,0.25754666328430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.01,0.08028799891471863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,balanced,0.2918773293495178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,balanced,0.39107199509938556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,balanced,0.055248002211252846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.01,0.08094720244407654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.01,0.06098560094833374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.01,0.08173440098762512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,balanced,0.4552853504816691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,balanced,0.05530133346716563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.01,0.08317440152168273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,balanced,0.5757706562678019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.01,0.06289920210838318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.01,0.08366720080375671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,balanced,0.05489600201447805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.01,0.06198400259017944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.01,0.08764799833297729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,balanced,0.5098613500595093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,balanced,0.05917333563168844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.01,0.09256960153579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.01,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,balanced,0.7375893592834473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,1,balanced,6.278703689575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,balanced,0.058517331878344216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.01,0.0991104006767273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.01,0.06461439728736877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.01,0.27974400520324705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,balanced,0.06011733412742615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,balanced,0.7709333101908366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.01,0.06652799844741822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.01,0.4287871837615967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,balanced,0.06043200194835663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.01,0.06832640171051026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,balanced,0.9172213077545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.01,0.9066240310668945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,balanced,0.06052266558011373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.01,0.07288960218429566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.01,0.9299776077270507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,balanced,1.0363679726918538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.01,0.07838720083236694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.01,0.9425919532775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.01,0.08548480272293091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.01,0.13497600555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.01,0.07578880190849305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,balanced,0.06248533229033152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.01,0.17824000120162964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.01,0.08965759873390197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,balanced,0.06287466486295064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,balanced,1.5233920415242512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,balanced,1.2606826623280842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.01,0.1870144009590149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.01,0.09194239974021912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.01,0.19574400186538696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.01,0.09505919814109802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.01,0.2554624080657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.01,0.10938880443572999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.01,0.31376640796661376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.01,0.13207039833068848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.01,0.14184319972991943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,balanced,2.1557440757751465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.01,0.42383360862731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,balanced,0.06282133360703786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.01,0.19621119499206544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.01,0.5333248138427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.01,0.26073598861694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,balanced,0.06401599943637848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.01,0.7422719955444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.01,0.34156160354614257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,balanced,0.06505066653092702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,balanced,2.9071839650472007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.01,0.9323712348937988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.01,0.3361855983734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,balanced,0.06477866570154826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.01,1.4099519729614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.01,0.4614272117614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.01,1.8861055374145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.01,0.569158411026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.01,2.6802175521850584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.01,0.8015487670898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.01,3.9902015686035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,balanced,4.053722699483235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.01,1.1539392471313477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.01,5.018022537231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.01,1.7264064788818358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.01,7.670297241210937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,balanced,0.07293333113193512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.01,2.269331169128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,balanced,0.07415999968846639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.01,15.461715698242188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,balanced,0.07513066629568736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.01,2.906604766845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.01,4.575046539306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,balanced,0.09156800309816997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.01,8.754994964599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,balanced,0.09523199995358785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,balanced,0.12195733189582825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,balanced,0.14626666903495789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,balanced,0.21320533752441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,balanced,0.25196800629297894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,balanced,0.41577064990997314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,power_law_1.01,0.05427839756011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,balanced,0.4967306852340698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,power_law_1.01,0.05408639907836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,power_law_1.01,0.05437440276145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,balanced,0.7530399958292643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,power_law_1.01,0.05811840295791626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,2,8,power_law_1.2,0.08305919766426087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,2,8,power_law_1.2,0.08438400030136109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,power_law_1.01,0.05894399881362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,2,8,power_law_1.2,0.08486400246620178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,balanced,1.001792033513387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,2,8,power_law_1.2,0.08558719754219055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,power_law_1.01,0.061843198537826535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,2,8,power_law_1.2,0.0863103985786438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,2,8,power_law_1.2,0.08963840007781983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,power_law_1.01,0.06869120001792908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,2,8,power_law_1.2,0.09470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,power_law_1.01,0.07523199915885925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,balanced,1.2389600276947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,2,8,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,2,8,power_law_1.2,0.4325376033782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,power_law_1.01,0.08223360180854797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,2,8,power_law_1.2,0.7657663822174072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,2,8,power_law_1.2,0.9186176300048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,2,8,power_law_1.2,0.9683520317077636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,2,8,power_law_1.2,0.9727807998657226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,balanced,1.9758399327596028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,2,8,power_law_1.2,0.1283136010169983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,power_law_1.01,0.07492480278015137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,2,8,power_law_1.2,0.15653120279312133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,2,8,power_law_1.2,0.17060480117797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,power_law_1.01,0.08394880294799804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,2,8,power_law_1.2,0.1887935996055603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,power_law_1.01,0.08325120210647582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,2,8,power_law_1.2,0.26869759559631345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,power_law_1.01,0.10959999561309815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,2,8,power_law_1.2,0.33639678955078123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,2,8,power_law_1.2,0.06128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,2,8,power_law_1.2,0.4578495979309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,2,8,power_law_1.2,0.5482304096221924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,2,8,power_law_1.2,0.06236159801483154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,power_law_1.01,0.1106112003326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,2,8,power_law_1.2,0.8183679580688477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,2,8,power_law_1.2,0.062009602785110474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,balanced,3.900383949279785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,power_law_1.01,0.12136960029602051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,2,8,power_law_1.2,0.9493568420410157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,2,8,power_law_1.2,0.06459519863128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,power_law_1.01,0.13934719562530518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,2,8,power_law_1.2,1.3814016342163087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,2,8,power_law_1.2,0.06485120058059693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,2,8,power_law_1.2,1.923980712890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,2,8,power_law_1.2,0.06628479957580566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,power_law_1.01,0.21155838966369628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,2,8,power_law_1.2,0.06908159852027893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,2,8,power_law_1.2,2.7186559677124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,power_law_1.01,0.23712000846862794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,2,8,power_law_1.2,0.07305600047111512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,2,8,power_law_1.2,3.8609344482421877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,2,8,power_law_1.2,0.07612159848213196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,power_law_1.01,0.3835455894470215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,2,8,power_law_1.2,0.08423039913177491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,2,8,power_law_1.2,4.460646438598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,2,8,power_law_1.2,0.07626879811286927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,2,8,power_law_1.2,0.05440639853477478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,2,8,power_law_1.2,0.08934400081634522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,power_law_1.01,0.4679232120513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,2,8,power_law_1.2,7.707308959960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,2,8,power_law_1.2,0.09184640049934387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,power_law_1.01,0.8561087608337402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,2,8,power_law_1.2,0.09388800263404846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,2,8,power_law_1.2,0.05438719987869263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,2,8,power_law_1.2,14.847859191894532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,2,8,power_law_1.2,0.11963520050048829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,power_law_1.01,0.9021696090698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,balanced,0.05766933163007101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,2,8,power_law_1.2,0.12698880434036255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,2,8,power_law_1.2,0.05443199872970581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,balanced,0.05738133192062378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,2,8,power_law_1.2,0.1394495964050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,balanced,0.08203733464082082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,power_law_1.01,1.526521587371826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,2,8,power_law_1.2,0.19277440309524535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,balanced,0.08535466591517131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,2,8,power_law_1.2,0.05780479907989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,2,8,power_law_1.2,0.25661439895629884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,power_law_1.01,1.872960090637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,balanced,0.08596266309420268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,2,8,power_law_1.2,0.05861120223999024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,2,8,power_law_1.2,0.38172800540924073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,power_law_1.01,2.459552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,balanced,0.08667199810345967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,2,8,power_law_1.2,0.3373503923416138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,2,8,power_law_1.2,0.0627776026725769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,balanced,0.08666666348775227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,power_law_1.01,3.3912254333496095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,2,8,power_law_1.2,0.5009215831756592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,2,8,power_law_1.2,0.5559807777404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,balanced,0.08681066830952962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,power_law_1.01,4.41847038269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,2,8,power_law_1.2,0.06883199810981751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,2,8,power_law_1.2,0.9184000015258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,balanced,0.04640000065167745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,balanced,0.08844266335169475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,balanced,0.0883840024471283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,power_law_1.01,7.08748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,2,8,power_law_1.2,1.2279744148254395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,balanced,0.043562665581703186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,2,8,power_law_1.2,0.07504000067710877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,balanced,0.05890666445096334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,balanced,0.09247466921806335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,2,8,power_law_1.2,1.7340991973876954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,power_law_1.01,12.867219543457031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,balanced,0.06305600206057231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,balanced,0.09344533085823059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,2,8,power_law_1.2,2.577004814147949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,2,8,power_law_1.2,0.08041599988937378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,balanced,0.062405332922935486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,balanced,0.09416000048319499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,2,8,power_law_1.2,3.1881471633911134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,balanced,0.06391466657320659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,2,8,power_law_1.2,0.08636800050735474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,balanced,0.0981333355108897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,2,8,power_law_1.2,4.588934326171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,balanced,0.06447466711203258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,balanced,0.10473066568374634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,2,8,power_law_1.2,9.19249267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,balanced,0.0642133355140686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,balanced,0.10563199718793233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,2,8,power_law_1.2,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,balanced,0.06541866560777028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,balanced,0.040336000422636666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,balanced,0.11161599556605022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,2,8,power_law_1.2,0.08666239976882935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,balanced,0.06558399895826976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,balanced,0.1178559958934784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,balanced,0.038405333956082664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,2,8,power_law_1.2,0.08958079814910888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,balanced,0.06564266482988994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,balanced,0.1411733329296112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,balanced,0.0533493310213089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,2,8,power_law_1.2,0.10661120414733886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,balanced,0.06763733426729839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,balanced,0.057130664587020874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,balanced,0.17525333166122437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,balanced,0.06888533135255177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,balanced,0.056976000467936196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,balanced,0.18530666828155518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,balanced,0.06924266616503398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,balanced,0.057904000083605446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,2,8,power_law_1.2,0.11188479661941528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,balanced,0.07983466486136119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,balanced,0.2571093241373698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,balanced,0.05851200222969055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,2,8,power_law_1.2,0.12396160364151002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,balanced,0.08158400158087413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,2,8,power_law_1.2,0.14979840517044068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,balanced,0.058592001597086586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,balanced,0.3083733320236206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,balanced,0.08362666765848796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,2,8,power_law_1.2,0.21144959926605225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,balanced,0.09297066926956177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,balanced,0.445087989171346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,2,8,power_law_1.2,0.29551360607147215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,balanced,0.06106133262316386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,balanced,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,balanced,0.06182399888833364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,2,8,power_law_1.2,0.4099584102630615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,balanced,0.5525013208389282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,balanced,0.13050132989883423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,2,8,power_law_1.2,0.49984002113342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,balanced,0.1479200025399526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,balanced,0.8210773468017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,2,8,power_law_1.2,0.811302375793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,balanced,0.20375466346740723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,2,8,power_law_1.2,0.9486207962036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,balanced,0.25673067569732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,balanced,1.0819520155588787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,2,8,power_law_1.2,1.4232192039489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,balanced,0.061754668752352394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,balanced,0.36101865768432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,2,8,power_law_1.2,1.6800512313842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,balanced,0.06296533346176147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,2,8,power_law_1.2,2.7805824279785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,balanced,0.4304266770680745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,balanced,0.06468266745408376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,balanced,1.3113226890563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,2,8,power_law_1.2,3.460230255126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,balanced,0.06505600114663442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,2,8,power_law_1.2,4.59119987487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,balanced,0.6360799868901571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,2,8,power_law_1.2,7.387168121337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,balanced,2.068357308705648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,2,8,power_law_1.2,13.335711669921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,balanced,0.8044640223185221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,balanced,0.07365333537260692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,balanced,0.07472533484299977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,balanced,0.9838026364644369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.01,0.07623040080070495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,balanced,0.07713599999745686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.01,0.07648640275001525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,balanced,0.09342400232950847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.01,0.08084480166435241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,balanced,0.10043733318646748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.01,0.08362879753112792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,balanced,4.035648028055827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,balanced,1.543733278910319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.01,0.08468480110168457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.01,0.08703359961509705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.01,0.09258239865303039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,balanced,0.13361066579818726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.01,0.09032319784164429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,balanced,0.16144532958666483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.01,0.38648319244384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.01,0.6803904056549073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,balanced,0.23145600159962973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.01,0.10093439817428589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,balanced,0.3078293402989705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.01,0.10391039848327636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,balanced,3.0049012502034507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.01,0.10415359735488891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.01,0.11891839504241944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.01,0.13687039613723756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,balanced,0.49208001295725506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.01,0.1580288052558899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.01,0.05592319965362549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.01,0.17646080255508423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.01,0.056383997201919556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,balanced,0.6501973470052084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.01,0.2026815891265869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.01,0.05551999807357788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.01,0.06211199760437012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.01,0.30462079048156737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.01,0.06239359974861145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,balanced,0.966048002243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.01,0.06503679752349853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.01,0.06565759778022766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.01,0.49390082359313964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.01,0.0679423987865448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,balanced,1.2829333146413167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.01,0.0654528021812439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.01,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.01,0.37835519313812255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.01,0.0728767991065979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.01,0.5161600112915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.01,0.07313920259475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,balanced,1.5834132830301921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,power_law_1.01,0.04682239890098572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.01,0.0790336012840271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.01,0.7864895820617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.01,0.08495360016822814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.01,0.09889919757843017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,power_law_1.01,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.01,1.116812801361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.01,0.10922240018844605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,power_law_1.01,0.0465472012758255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.01,0.11962239742279053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.01,1.5414655685424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.01,0.12438399791717529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,power_law_1.01,0.056480002403259275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,4,power_law_1.2,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.01,0.19301120042800904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,balanced,2.522885322570801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.01,2.0657535552978517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.01,0.2818880081176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,power_law_1.01,0.05633280277252197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,4,power_law_1.2,0.07122560143470764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.01,0.25426559448242186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.01,2.717075157165527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,power_law_1.01,0.05894399881362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.01,0.3330687999725342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,4,power_law_1.2,0.08120959997177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.01,3.062227249145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,power_law_1.01,0.06444799900054932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.01,0.5669439792633056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,4,power_law_1.2,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,power_law_1.01,0.06630399823188782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.01,0.631987190246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.01,5.232928085327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,4,power_law_1.2,0.08472959995269776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.01,0.9235584259033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,4,power_law_1.2,0.08769919872283935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.01,1.3021183967590333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,power_law_1.01,0.06765440106391907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.01,11.602899169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,4,power_law_1.2,0.09062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.01,1.7825983047485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,power_law_1.01,0.07401599884033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,4,power_law_1.2,0.09080960154533387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,balanced,5.027935981750488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.01,2.5482431411743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,4,power_law_1.2,0.5349120140075684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.01,3.591948699951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,4,power_law_1.2,0.6858496189117431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,power_law_1.01,0.07166079878807068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,4,power_law_1.2,0.09840000271797181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,power_law_1.01,0.07518720030784606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.01,8.001535797119141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,4,power_law_1.2,0.10487040281295776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,power_law_1.01,0.07690879702568054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,4,power_law_1.2,0.10828800201416015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,power_law_1.01,0.09376000165939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,4,power_law_1.2,0.12685439586639405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,4,power_law_1.2,0.131494402885437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,power_law_1.01,0.08780159950256347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,4,power_law_1.2,0.14275840520858765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,power_law_1.01,0.1044160008430481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,4,power_law_1.2,0.1751680016517639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,power_law_1.01,0.1279680013656616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,4,power_law_1.2,0.18703360557556153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,power_law_1.01,0.15029120445251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,4,power_law_1.2,0.29227519035339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,4,power_law_1.2,0.5156352043151855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,power_law_1.01,0.22088320255279542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,4,power_law_1.2,0.4404416084289551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,4,power_law_1.2,0.05279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,power_law_1.01,0.2302527904510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,4,power_law_1.2,0.540940809249878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,power_law_1.01,0.34301440715789794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,4,power_law_1.2,0.050521600246429446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,4,power_law_1.2,0.6866047859191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,power_law_1.01,0.6030144214630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,4,power_law_1.2,0.05917440056800842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,4,power_law_1.2,0.8440383911132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,power_law_1.01,0.6849855899810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,4,power_law_1.2,0.06178560256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,4,power_law_1.2,1.3225855827331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,4,power_law_1.2,0.06252800226211548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,4,power_law_1.2,2.2085119247436524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,power_law_1.01,1.202348804473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,4,power_law_1.2,0.06365439891815186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,4,power_law_1.2,2.3316736221313477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,power_law_1.01,1.7100479125976562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,4,power_law_1.2,0.06709120273590088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,4,power_law_1.2,0.06926720142364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,4,power_law_1.2,4.564019012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,power_law_1.01,2.833919906616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,4,power_law_1.2,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,4,power_law_1.2,5.3683326721191404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,4,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,power_law_1.01,3.422547149658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,4,power_law_1.2,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,4,power_law_1.2,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,power_law_1.01,4.08031997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,4,power_law_1.2,0.07089279890060425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,4,power_law_1.2,10.82097930908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,4,power_law_1.2,0.04776319861412048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,4,power_law_1.2,0.07926399707794189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,power_law_1.01,7.2806846618652346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,4,power_law_1.2,0.07966079711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,4,power_law_1.2,0.055904000997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,balanced,0.04138666639725367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,4,power_law_1.2,0.0567359983921051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,4,power_law_1.2,0.08270080089569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,balanced,0.056688000758488975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,power_law_1.01,13.33555908203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,4,power_law_1.2,0.05861759781837463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,4,power_law_1.2,0.10372480154037475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,balanced,0.08448533217112224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,4,power_law_1.2,0.06314880251884461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,balanced,0.08501866459846497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,4,power_law_1.2,0.11266560554504394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,4,power_law_1.2,0.0702015995979309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,balanced,0.0858026643594106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,balanced,0.08595200379689534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,4,power_law_1.2,0.10891519784927368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,balanced,0.08729599912961324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,4,power_law_1.2,0.07514240145683289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,balanced,0.08887466788291931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,4,power_law_1.2,0.13570560216903688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,balanced,0.08897067109743755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,4,power_law_1.2,0.07501440048217774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,4,power_law_1.2,0.1919935941696167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,balanced,0.0930560032526652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,balanced,0.09458133578300476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,4,power_law_1.2,0.2522304058074951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,balanced,0.09559999903043111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,4,power_law_1.2,0.07381119728088378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,4,power_law_1.2,0.26837759017944335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,balanced,0.09908800323804219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,4,power_law_1.2,0.07607679963111877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,balanced,0.1039573351542155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,4,power_law_1.2,0.45452160835266114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,balanced,0.10636799534161885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,4,power_law_1.2,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,balanced,0.11546132961908977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,4,power_law_1.2,0.5559552192687989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,4,power_law_1.2,0.09177600145339966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,balanced,0.12147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,4,power_law_1.2,0.7606207847595214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,balanced,0.12736533085505167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,4,power_law_1.2,0.8785728454589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,balanced,0.18247467279434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,4,power_law_1.2,1.2744256019592286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,balanced,0.19747199614842734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,4,power_law_1.2,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,4,power_law_1.2,1.928870391845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,balanced,0.27454400062561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,4,power_law_1.2,0.10047999620437623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,4,power_law_1.2,0.12188160419464111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,4,power_law_1.2,2.5097280502319337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,balanced,0.3421386480331421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,4,power_law_1.2,0.17278079986572265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,balanced,0.48877867062886554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,4,power_law_1.2,4.245139312744141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,4,power_law_1.2,0.19385600090026855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,balanced,0.5987253189086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,4,power_law_1.2,7.091327667236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,4,power_law_1.2,0.2678911924362183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,balanced,0.9137173493703207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,4,power_law_1.2,0.2987584114074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,4,power_law_1.2,0.7217535972595215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,4,power_law_1.2,0.893887996673584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,balanced,1.1933546861012776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,balanced,0.03620799879233042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,4,power_law_1.2,1.409926414489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,balanced,0.042506664991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,balanced,1.4844746589660645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.01,0.05508480072021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,balanced,0.05825600028038025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,4,power_law_1.2,1.872889518737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,balanced,0.061568001906077065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.01,0.058508801460266116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,balanced,0.06171200176080068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,4,power_law_1.2,2.7416767120361327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,balanced,0.0627040018637975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.01,0.06049280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,balanced,0.06357866525650024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,4,power_law_1.2,3.615500640869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.01,0.08047999739646912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,balanced,0.06440000236034393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,balanced,2.330495993296305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.01,0.08293120265007019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,balanced,0.06428266565004985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,4,power_law_1.2,4.423712158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,balanced,0.06481599807739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.01,0.08597760200500489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,balanced,0.06669333577156067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,4,power_law_1.2,7.571270751953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.01,0.08974720239639282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,balanced,0.06710400183995564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,balanced,0.0680320014556249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.01,0.09128320217132568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,balanced,0.02898666759332021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,balanced,0.07006399830182393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.01,0.236844801902771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,4,power_law_1.2,15.653900146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,balanced,0.0787360022465388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,balanced,0.036746665835380554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.01,0.37699840068817136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,balanced,0.07944533228874207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,balanced,0.052042668064435325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,balanced,0.0848640004793803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.01,0.09716479778289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,balanced,0.0944640040397644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,balanced,0.056101332108179726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,balanced,4.317829449971517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.01,0.10378880500793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,balanced,0.10500267148017883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,balanced,0.05633600056171417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.01,0.10434559583663941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,balanced,0.13858133554458618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,balanced,0.05747200051943461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.01,0.1258944034576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,balanced,0.15838399529457092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,balanced,0.05850133299827576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.01,0.12466559410095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,balanced,0.21913067499796549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,balanced,0.05926933387915293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.01,0.12437119483947753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,balanced,0.2797279953956604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.01,0.11630079746246338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.01,0.16661759614944457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,balanced,0.39046398798624676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.01,0.18143999576568604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,balanced,0.06027733286221822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,balanced,0.4843573172887166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.01,0.2263040065765381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,balanced,0.061050668358802795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.01,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.01,0.40579838752746583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,balanced,0.7172746658325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.01,0.501913595199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.01,0.7625664234161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.01,0.8929023742675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,balanced,0.9223146438598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.01,1.4061568260192872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.01,0.04214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.01,1.6253183364868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,balanced,1.1341919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.01,0.04503040015697479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.01,2.3736831665039064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.01,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.01,3.433484649658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,balanced,0.06342400113741557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.01,0.06056960225105286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,power_law_1.01,0.03480319976806641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.01,0.06159359812736511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.01,6.4757568359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,balanced,1.7973653475443523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,power_law_1.01,0.04270719885826111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,balanced,0.06678399940331776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.01,0.06340479850769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,power_law_1.01,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,balanced,0.06838933130105336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.01,0.06490240097045899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,power_law_1.01,0.05575039982795715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,power_law_1.01,0.056908798217773435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.01,0.06673920154571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,power_law_1.01,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,power_law_1.01,0.062412798404693604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.01,0.06775680184364319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,power_law_1.01,0.06303359866142273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,balanced,0.07805866499741872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.01,0.06665599942207337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,balanced,0.07960000137488048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.01,0.07069439888000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,balanced,3.3950719833374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,power_law_1.01,0.06442880034446716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,balanced,0.08525333801905315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.01,0.07115520238876342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,power_law_1.01,0.06734079718589783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.01,0.07246720194816589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,balanced,0.10493866602579753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.01,0.0847487986087799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,balanced,0.11530133088429768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.01,0.09057279825210571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,power_law_1.01,0.07089920043945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,balanced,0.15270933508872986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.01,0.09348480105400085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,power_law_1.01,0.07307519912719726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,balanced,0.19401599963506064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.01,0.10644479990005493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,power_law_1.01,0.07550079822540283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,balanced,0.29370667537053424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,power_law_1.01,0.0843392014503479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.01,0.11966079473495483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.01,0.14016640186309814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,balanced,0.3938080072402954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,power_law_1.01,0.09382399916648865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.01,0.1855936050415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.01,0.2178368091583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,power_law_1.01,0.09499520063400269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.01,0.26981120109558104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,2,power_law_1.2,0.057555198669433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,power_law_1.01,0.11320320367813111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.01,0.3546751976013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,power_law_1.01,0.13626240491867064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,2,power_law_1.2,0.055180799961090085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.01,0.5049280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,power_law_1.01,0.16757760047912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,2,power_law_1.2,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,balanced,0.6035306851069132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.01,0.7251967906951904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,power_law_1.01,0.22968320846557616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,2,power_law_1.2,0.08300160169601441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.01,1.0817791938781738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,power_law_1.01,0.29552640914916994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,balanced,0.7927146752675375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,2,power_law_1.2,0.08315520286560059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.01,1.2184384346008301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,power_law_1.01,0.46979198455810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,power_law_1.01,0.6488128185272217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,2,power_law_1.2,0.08532480001449586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.01,1.717478370666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,2,power_law_1.2,0.08709120154380798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,balanced,1.1733706792195637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.01,2.916921615600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,power_law_1.01,0.8049599647521972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,2,power_law_1.2,0.0917952001094818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,power_law_1.01,1.147539234161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,2,power_law_1.2,0.37616639137268065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.01,5.2278400421142575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,power_law_1.01,1.7313919067382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,2,power_law_1.2,0.5198912143707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,balanced,1.5451946258544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,power_law_1.01,2.1374591827392577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,2,power_law_1.2,0.10151040554046631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,power_law_1.01,3.232147216796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,2,power_law_1.2,0.10402560234069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,power_law_1.01,4.345427322387695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,2,power_law_1.2,0.1018496036529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,balanced,1.916170597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,2,power_law_1.2,0.12254719734191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,power_law_1.01,10.482444763183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,2,power_law_1.2,0.12394239902496337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,2,power_law_1.2,0.1280832052230835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,2,power_law_1.2,0.04286080002784729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,2,power_law_1.2,0.13301759958267212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,2,power_law_1.2,0.17828480005264283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,2,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,balanced,3.0408480962117515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,2,power_law_1.2,0.18919680118560792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,2,power_law_1.2,0.04806399941444397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,2,power_law_1.2,0.06037759780883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,2,power_law_1.2,0.24872961044311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,2,power_law_1.2,0.06151679754257202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,2,power_law_1.2,0.3299328088760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,2,power_law_1.2,0.06170240044593811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,2,power_law_1.2,0.39836161136627196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,2,power_law_1.2,0.06606079936027527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,balanced,6.03652826944987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,2,power_law_1.2,0.513753604888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,2,power_law_1.2,0.06698240041732788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,2,power_law_1.2,0.06737279891967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,2,power_law_1.2,0.6689151763916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,2,power_law_1.2,0.06748800277709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,2,power_law_1.2,0.9619968414306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,2,power_law_1.2,0.07167360186576843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,2,power_law_1.2,0.07273600101470948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,2,power_law_1.2,1.4214464187622071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,2,power_law_1.2,0.07242239713668823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,2,power_law_1.2,0.08373759984970093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,2,power_law_1.2,1.952774429321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,2,power_law_1.2,0.08991360068321227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,2,power_law_1.2,2.325497627258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,2,power_law_1.2,0.09171199798583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,2,power_law_1.2,0.10306559801101685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,2,power_law_1.2,3.924224090576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,2,power_law_1.2,0.13425920009613038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,2,power_law_1.2,0.149452805519104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,2,power_law_1.2,6.767692565917969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,2,power_law_1.2,0.17993600368499757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,2,power_law_1.2,0.21566081047058105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,2,power_law_1.2,0.29877119064331054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,2,power_law_1.2,0.40833277702331544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,2,power_law_1.2,0.5618368148803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,2,power_law_1.2,0.7243264198303223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,2,power_law_1.2,1.0326592445373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,2,power_law_1.2,1.3734144210815429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,2,power_law_1.2,1.7770111083984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,2,power_law_1.2,2.784819221496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,2,power_law_1.2,4.2863616943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,balanced,0.04363733530044556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,balanced,0.05653333167235056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,balanced,0.07814933359622955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,balanced,0.08480532964070638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,2,power_law_1.2,0.036934399604797365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,balanced,0.08122133215268452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,2,power_law_1.2,0.038649600744247434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,balanced,0.08193600177764893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,2,power_law_1.2,0.04288640022277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,balanced,0.08253333469231923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,2,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,balanced,0.08707200487454732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,2,power_law_1.2,0.05629439949989319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,balanced,0.08973333239555359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,2,power_law_1.2,0.0607807993888855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,balanced,0.08981866637865703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,2,power_law_1.2,0.06293759942054748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,balanced,0.09391466776529948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,balanced,0.09638399879137675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,2,power_law_1.2,0.06466559767723083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,balanced,0.09754133224487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,balanced,0.1030346651871999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,2,power_law_1.2,0.06600319743156433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,balanced,0.11163199941317241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,2,power_law_1.2,0.06684160232543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,balanced,0.11290132999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,balanced,0.1200266679128011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,balanced,0.15185599525769553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,2,power_law_1.2,0.07139840126037597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,balanced,0.14683199922243753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,2,power_law_1.2,0.07291520237922669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,balanced,0.1873706579208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,2,power_law_1.2,0.07449600100517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,2,power_law_1.2,0.07603840231895446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,balanced,0.22081599632898966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,balanced,0.3089653253555298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,2,power_law_1.2,0.09444479942321778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,balanced,0.39638932545979816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,2,power_law_1.2,0.09568639993667602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,2,power_law_1.2,0.11178239583969116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,balanced,0.5680319865544637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,2,power_law_1.2,0.14568959474563598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,balanced,0.04077333211898804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,2,power_law_1.2,0.17770880460739136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,balanced,0.058789332707722984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,balanced,0.7242773373921713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.04845440089702606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,balanced,0.06272533535957336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,2,power_law_1.2,0.22867839336395263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.05486080050468445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,balanced,0.06292800108591716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,2,power_law_1.2,0.3178879976272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,balanced,1.096981366475423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,balanced,0.06324266890684764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.081632000207901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,2,power_law_1.2,0.41281280517578123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.03681280016899109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,balanced,0.06506666541099548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.07881600260734559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,2,power_law_1.2,0.6832831859588623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,balanced,0.06429333488146464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.08125439882278443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,balanced,0.06506666541099548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,balanced,1.3816426595052083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.04248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,balanced,0.06647466619809468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,2,power_law_1.2,0.9558272361755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,balanced,0.03014400104681651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.060096001625061034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,balanced,0.06797866523265839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,2,power_law_1.2,1.2425536155700683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,balanced,0.07002666592597961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.2314687967300415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.060108798742294314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,balanced,1.6880799929300945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,2,power_law_1.2,1.886400032043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,balanced,0.03722666700681051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,balanced,0.07167999943097432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.6481791973114014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.06376320123672485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,balanced,0.0753119985262553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,balanced,0.05407999952634176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,2,power_law_1.2,2.732211112976074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.09971839785575867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.06610559821128845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,balanced,0.08306666711966197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.10236799716949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,balanced,0.05820799867312113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,2,power_law_1.2,2.9279808044433593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.06583679914474487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,balanced,0.08392533659934998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.10400639772415161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,balanced,0.05789333085219065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.06707199811935424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,balanced,2.6415039698282876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,balanced,0.09142933289210002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,2,power_law_1.2,5.16382064819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.11745280027389526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,balanced,0.28758933146794635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.06836479902267456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,balanced,0.11169067025184631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,balanced,0.061018665631612144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.06901119947433472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.13820159435272217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,2,power_law_1.2,10.338066864013673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,balanced,0.12102933724721272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,balanced,0.0613919993241628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.07511680126190186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.13213440179824829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.07546240091323853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,balanced,0.15782399972279867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.12707200050354003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.08859519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.16750719547271728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,balanced,0.18289599816004434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.09351680278778077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.18108160495758058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,balanced,0.26410667101542157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.09672319889068604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,balanced,0.06412800153096516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.21091198921203613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,balanced,0.34384000301361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,balanced,5.105999946594238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,balanced,0.06547733147939046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.24113919734954833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.12551039457321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,balanced,0.4918239911397298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.31831679344177244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.1375167965888977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,power_law_1.01,0.031206399202346802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.4084159851074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.01,0.17794560194015502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,balanced,0.63045867284139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.04345600008964538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,power_law_1.01,0.032543998956680295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.19211519956588746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.01,0.577023983001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.04684799909591675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,power_law_1.01,0.04002560079097748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.01,0.7614336013793945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,balanced,0.9233226776123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,balanced,0.06810133159160614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.34323840141296386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,power_law_1.01,0.05469440221786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.01,1.1348992347717286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.0816703975200653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,power_law_1.01,0.05667200088500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,balanced,0.07160000006357829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,0.4787136077880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.01,1.4222911834716796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,balanced,0.07375999788443248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,balanced,1.1984799702962239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.07875199913978577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,power_law_1.01,0.058323198556900026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,0.6147136211395263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.01,1.7999935150146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,balanced,0.07746133208274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.0813759982585907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,0.9003775596618653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,power_law_1.01,0.061715197563171384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.01,2.631020736694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.08772479891777038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,power_law_1.01,0.06449919939041138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,1.2099904060363769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,balanced,1.4774932861328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.01,5.110515213012695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.09127039909362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.01,1.5142144203186034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,balanced,0.08887466788291931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.5156223773956299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.01,2.3939008712768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,power_law_1.01,0.06721919775009155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,balanced,0.09285333752632141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.8057600021362304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,balanced,0.10040533542633057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.01,4.365254211425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,power_law_1.01,0.06858879923820496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.09690240025520325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,balanced,0.13226133584976196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,balanced,0.150629331668218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,balanced,2.350122610727946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.10250879526138305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,balanced,0.22275733947753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.10358400344848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,power_law_1.01,0.07444480061531067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,balanced,0.2959466576576233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,power_law_1.01,0.07541120052337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.12120959758758545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,balanced,0.42766400178273517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,power_law_1.01,0.07795199751853943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.13008639812469483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,balanced,0.5593279997507731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,power_law_1.01,0.08214399814605713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.13276159763336182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.12445440292358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,power_law_1.01,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.16895359754562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,balanced,4.507722536722819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,power_law_1.01,0.10152319669723511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,balanced,0.8446613152821859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.17431679964065552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.21222400665283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,power_law_1.01,0.11145600080490112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,balanced,1.1027572949727376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.23447680473327637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,power_law_1.01,0.1362496018409729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.3159615993499756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.01,0.16591999530792237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,balanced,1.6378080050150554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.4042623996734619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.01,0.24060161113739015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,1,power_law_1.2,0.5842239856719971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.01,0.3089600086212158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,balanced,2.1720639864603677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,1,power_law_1.2,0.7682623863220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.01,0.44490880966186525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,1,power_law_1.2,1.1608256340026855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.01,0.5707647800445557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,1,power_law_1.2,1.4288384437561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.01,0.8551487922668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,balanced,2.6877867380777993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,1,power_law_1.2,1.790425682067871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.01,1.1141440391540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,1,power_law_1.2,2.625766372680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.01,1.6358783721923829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,1,power_law_1.2,5.120537567138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.01,2.1664960861206053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,balanced,4.282853444417317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.01,2.702841567993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,power_law_1.01,4.292595291137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,power_law_1.01,8.55910415649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,balanced,8.528373082478842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.03560959994792938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.045664000511169436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.06069759726524353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.060313600301742556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,1,power_law_1.2,0.03025279939174652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.06392959952354431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,1,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.0654528021812439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,1,power_law_1.2,0.03638400137424469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.06782720088958741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,1,power_law_1.2,0.05546879768371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.06952319741249084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,1,power_law_1.2,0.05594239830970764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.06857600212097167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,1,power_law_1.2,0.060121601819992064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,1,power_law_1.2,0.06401280164718628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.07312639951705932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,1,power_law_1.2,0.06564480066299438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.07555840015411378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.08187519907951354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,balanced,0.09073600172996521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.09538559913635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,balanced,0.14121599992116293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,1,power_law_1.2,0.06871039867401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,balanced,0.08162133395671844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.09433599710464477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,balanced,0.12291733423868816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,1,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,balanced,0.0812906672557195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,balanced,0.12239999572436015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,balanced,0.085807998975118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.09713280200958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,balanced,0.12478933731714885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,balanced,0.0857919951279958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.1295040011405945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,balanced,0.08676266670227051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,balanced,0.12476266423861186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,1,power_law_1.2,0.0765504002571106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,balanced,0.08780266841252644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,balanced,0.1253866652647654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,1,power_law_1.2,0.07785599827766418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.13871359825134277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,balanced,0.08745599786440532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,balanced,0.12596266468365988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,1,power_law_1.2,0.07925119996070862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,balanced,0.08805333574612935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.1794816017150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,balanced,0.12713066736857095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,balanced,0.08960533142089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,1,power_law_1.2,0.08367999792098998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,balanced,0.09287466605504353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.1918463945388794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,balanced,0.12934399644533792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,balanced,0.09046933054924011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.2661184072494507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,balanced,0.12900267044703165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,1,power_law_1.2,0.09882240295410157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,balanced,0.09215999643007915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,balanced,0.09355200330416362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.34138879776000974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,balanced,0.1357599993546804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,1,power_law_1.2,0.09998080134391785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,balanced,0.10845866799354553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,0.4814015865325928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,balanced,0.13403733571370444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,1,power_law_1.2,0.1115007996559143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,balanced,0.11055999994277954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,balanced,0.1346986691157023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,1,power_law_1.2,0.14473600387573243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,balanced,0.11035733421643575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,0.6217088222503662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,balanced,0.12909332911173502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.2,0.16660480499267577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,balanced,0.14614933729171753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,0.9114175796508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,balanced,0.08435733119646709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,balanced,0.13142933448155722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.2,0.2394047975540161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,balanced,0.1625546713670095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,1.2144000053405761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,balanced,0.19690134127934775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.2,0.31103360652923584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,balanced,0.16500799854596457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,balanced,0.18992000818252563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,balanced,0.07517333328723907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,1,power_law_1.2,1.519379234313965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.2,0.44394879341125487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,balanced,0.1590506633122762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,balanced,0.28359999259312946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.2,0.5757952213287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,balanced,0.07489599784215291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,1,power_law_1.2,2.374092864990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,balanced,0.18838399648666382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,balanced,0.33689598242441815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,balanced,0.07884799937407176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,balanced,0.1729653278986613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,1,power_law_1.2,4.374297714233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.2,0.8713472366333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,balanced,0.48099732398986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,balanced,0.07890133559703827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,balanced,0.3566879828770955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.2,1.117728042602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,balanced,0.07960000137488048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.01,0.13925119638442993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,balanced,0.5888640085856119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,balanced,0.25598933299382526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.2,1.6542207717895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,balanced,0.08081066608428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.01,0.12117760181427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.2,2.18143367767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,balanced,0.3991039991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,balanced,0.08056533336639404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,balanced,0.8802613417307535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.01,0.12088960409164429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.2,2.7264192581176756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,balanced,0.4663306474685669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.01,0.12412159442901612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,1,power_law_1.2,4.313772964477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,balanced,0.08435733119646709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,balanced,1.1686773300170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.01,0.1241919994354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,balanced,0.6786986986796061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,balanced,0.0858026643594106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.01,0.13086719512939454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,1,power_law_1.2,8.582527923583985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.01,0.08993279933929443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,balanced,0.8166879812876383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.01,0.13935359716415405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,balanced,1.4727999369303386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.01,0.13338880538940429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,balanced,1.2378133138020833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.01,0.08095999956130981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.01,0.6433216094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.01,0.08119040131568908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.01,1.403116798400879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,balanced,0.08517332871754964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,balanced,1.5867466926574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,balanced,2.285520076751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.01,0.08506879806518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.01,1.3595775604248046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,balanced,0.08676266670227051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.01,0.08497920036315917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,balanced,0.08813333511352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.01,1.4061568260192872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,balanced,0.08852266271909077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.01,0.08810240030288696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.01,1.4689663887023925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,balanced,2.023248036702474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.01,0.1009600043296814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.01,0.1934272050857544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.01,0.09015679955482483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,power_law_1.01,0.0830847978591919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.01,0.2421056032180786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.01,0.09590399861335755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,power_law_1.01,0.07402240037918091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,power_law_1.01,0.07443199753761291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.01,0.25645439624786376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.01,0.10005120038986207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,balanced,4.526032129923503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,power_law_1.01,0.07773439884185791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,balanced,3.221861203511556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.01,0.404256010055542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.01,0.09750400185585022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,power_law_1.01,0.07861120104789734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,balanced,0.09724799791971843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,power_law_1.01,0.08923519849777221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.01,0.658457612991333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.01,0.10417920351028442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,balanced,0.10044800241788228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,power_law_1.01,0.10430079698562622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.01,0.11397759914398194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,power_law_1.01,0.10910719633102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.01,0.5427135944366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,balanced,0.1029919981956482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.01,0.12894079685211182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.01,0.7306687831878662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,power_law_1.01,0.11395839452743531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.01,0.16342400312423705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.01,0.7263552188873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,power_law_1.01,0.12412799596786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.01,0.19470080137252807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.01,1.0843392372131349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.01,0.23671040534973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,balanced,0.12383466958999634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.01,1.4319104194641112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.01,0.3111680030822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,balanced,6.641712188720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,balanced,0.13012799620628357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,power_law_1.01,0.10469119548797608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.01,0.3654335975646973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.01,2.3058048248291017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,power_law_1.01,0.12161279916763305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.01,0.5496831893920898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,power_law_1.01,0.1342527985572815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.01,2.8235008239746096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,power_law_1.01,0.15997439622879028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.01,0.46944642066955566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,balanced,0.17824532588322958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.01,4.546131134033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.01,0.6636991977691651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,balanced,0.22064000368118286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.01,0.8530752182006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,power_law_1.01,0.15459200143814086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.01,6.140108871459961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,power_law_1.01,0.14881919622421264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.01,1.2605055809020995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,balanced,0.3275946577390035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.01,9.037574768066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,power_law_1.01,0.1956928014755249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.01,1.8577856063842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,balanced,0.36559998989105225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,power_law_1.01,0.2926079988479614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.01,2.800908851623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.01,14.288946533203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,power_law_1.01,0.36959359645843504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.01,3.6835006713867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,power_law_1.01,0.6521152019500732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.01,25.354035949707033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.01,3.845907211303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,power_law_1.01,0.75033597946167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,balanced,0.5825440088907877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,power_law_1.01,1.0719167709350585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.01,6.326752090454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,power_law_1.01,1.1576319694519044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.01,14.70043487548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,balanced,0.755237340927124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,power_law_1.01,2.015238380432129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,power_law_1.01,2.6237056732177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,power_law_1.01,3.8688129425048827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,balanced,1.1283573309580486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,power_law_1.01,5.502848052978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,power_law_1.01,6.675590515136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,balanced,1.4881226221720378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,power_law_1.01,9.744691467285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,balanced,1.8498506546020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,power_law_1.01,22.55278778076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,balanced,2.948474566141764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,2,8,power_law_1.2,0.13912960290908813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,2,8,power_law_1.2,0.1210752010345459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,2,8,power_law_1.2,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,2,8,power_law_1.2,0.12444800138473511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,2,8,power_law_1.2,0.12444800138473511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,balanced,5.880954742431641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,2,8,power_law_1.2,0.1335487961769104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,2,8,power_law_1.2,0.08934400081634522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,2,8,power_law_1.2,0.14846080541610718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,2,8,power_law_1.2,0.1370687961578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,2,8,power_law_1.2,0.08168320059776306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,2,8,power_law_1.2,0.38839681148529054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,2,8,power_law_1.2,0.08158720135688782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,2,8,power_law_1.2,0.896998405456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,2,8,power_law_1.2,0.08531200289726257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,2,8,power_law_1.2,1.1443519592285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,2,8,power_law_1.2,0.08607360124588012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,2,8,power_law_1.2,1.453376007080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,2,8,power_law_1.2,0.09102079868316651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,2,8,power_law_1.2,1.4392383575439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,2,8,power_law_1.2,0.09565439820289612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,2,8,power_law_1.2,0.20177919864654542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,2,8,power_law_1.2,0.09038720130920411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,2,8,power_law_1.2,0.2990015983581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,2,8,power_law_1.2,0.09886720180511474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,2,8,power_law_1.2,0.25601279735565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,2,8,power_law_1.2,0.09907839894294738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,2,8,power_law_1.2,0.3671999931335449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,2,8,power_law_1.2,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,2,8,power_law_1.2,0.08293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,2,8,power_law_1.2,0.10488959550857543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,2,8,power_law_1.2,0.6305280208587647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,2,8,power_law_1.2,0.11249920129776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,2,8,power_law_1.2,0.5346047878265381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,2,8,power_law_1.2,0.07399680018424988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,2,8,power_law_1.2,0.13941760063171388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,2,8,power_law_1.2,0.07449600100517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,2,8,power_law_1.2,0.1897279977798462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,2,8,power_law_1.2,0.7294079780578613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,2,8,power_law_1.2,0.21334400177001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,2,8,power_law_1.2,0.07768319845199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,2,8,power_law_1.2,0.7829504013061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,2,8,power_law_1.2,0.2161344051361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,2,8,power_law_1.2,0.07850239872932434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,2,8,power_law_1.2,1.1674816131591796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,2,8,power_law_1.2,0.3268928050994873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,2,8,power_law_1.2,0.08533759713172913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,2,8,power_law_1.2,0.4039423942565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,2,8,power_law_1.2,1.4685888290405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,2,8,power_law_1.2,0.6052735805511474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,2,8,power_law_1.2,0.10836479663848878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,2,8,power_law_1.2,2.498931121826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,2,8,power_law_1.2,0.48769278526306153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,2,8,power_law_1.2,0.1118016004562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,2,8,power_law_1.2,0.7012351989746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,2,8,power_law_1.2,2.659744071960449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,balanced,0.08172800143559773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,2,8,power_law_1.2,0.9273728370666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,2,8,power_law_1.2,4.7383872985839846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,2,8,power_law_1.2,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,2,8,power_law_1.2,1.5217791557312013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,balanced,0.08014933268229167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,2,8,power_law_1.2,1.7543359756469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,2,8,power_law_1.2,0.12321280241012574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,balanced,0.12236266334851582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,2,8,power_law_1.2,7.045728302001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,2,8,power_law_1.2,2.7005695343017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,balanced,0.12689066926638284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,2,8,power_law_1.2,3.9287166595458984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,2,8,power_law_1.2,8.488870239257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,balanced,0.12640532851219177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,2,8,power_law_1.2,0.10459519624710083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,balanced,0.12691733241081238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,2,8,power_law_1.2,4.8706817626953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,balanced,0.1281013290087382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,2,8,power_law_1.2,0.12111999988555908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,2,8,power_law_1.2,14.110566711425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,2,8,power_law_1.2,6.657939147949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,balanced,0.12847466270128885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,2,8,power_law_1.2,0.12359039783477783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,balanced,0.13082133730252585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,2,8,power_law_1.2,0.15466879606246947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,balanced,0.06088533500830332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,2,8,power_law_1.2,15.155596923828124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,2,8,power_law_1.2,22.656556701660158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,balanced,0.131221334139506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,balanced,0.05663466453552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,balanced,0.14031466841697693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,2,8,power_law_1.2,0.16082559823989867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,balanced,0.1388266682624817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,balanced,0.08528000116348267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,2,8,power_law_1.2,0.17150720357894897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,balanced,0.13940266768137613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,balanced,0.08405866225560506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,2,8,power_law_1.2,0.21191039085388183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,balanced,0.1402666668097178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,balanced,0.08520533641179402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,balanced,0.1555519998073578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,2,8,power_law_1.2,0.3089087963104248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,balanced,0.08649599552154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,balanced,0.15741866827011108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,balanced,0.08678932984670003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,2,8,power_law_1.2,0.40711679458618166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,balanced,0.15988266468048096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,balanced,0.08699733018875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,balanced,0.17484800020853677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,balanced,0.08915733297665913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,2,8,power_law_1.2,0.6506815910339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,balanced,0.08989333113034566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,2,8,power_law_1.2,0.8455679893493653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,balanced,0.17577066024144491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,balanced,0.08979733784993489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,2,8,power_law_1.2,1.0386303901672362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,balanced,0.2834506630897522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,balanced,0.09293867150942485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,2,8,power_law_1.2,1.4040063858032226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,balanced,0.27405333518981934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,balanced,0.09454933802286784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.01,0.13390079736709595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,balanced,0.1069599986076355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,balanced,0.38005868593851727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,2,8,power_law_1.2,2.218361663818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.01,0.11123199462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,balanced,0.10610133409500122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,balanced,0.4577386776606242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.01,0.10497920513153076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,balanced,0.11215999722480774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,2,8,power_law_1.2,2.789190483093262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,balanced,0.05426666637261709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,balanced,0.1276800036430359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.01,0.1254591941833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,2,8,power_law_1.2,4.181593704223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,balanced,0.05031999945640564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,balanced,0.6779200236002604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,balanced,0.13220266501108804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.01,0.1260032057762146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,balanced,0.07378666599591573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,2,8,power_law_1.2,5.239276885986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,balanced,0.2019360065460205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.01,0.13266559839248657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,balanced,0.9161120255788168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,balanced,0.07796800136566162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.01,0.13556480407714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,2,8,power_law_1.2,6.543513488769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,balanced,0.2044960061709086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,balanced,0.07764266431331635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.01,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,balanced,1.3848053614298503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,balanced,0.2824053366978963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,2,8,power_law_1.2,10.352928161621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,balanced,0.07889066636562347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.01,0.36062719821929934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,balanced,0.3412746588389079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,balanced,0.08051733175913493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.01,1.251360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,balanced,1.741498629252116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,2,8,power_law_1.2,21.925637817382814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,balanced,0.49538131554921466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,balanced,0.07983466486136119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.01,0.1580288052558899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.01,0.16532479524612426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,balanced,0.6438773473103842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.01,0.1604159951210022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,balanced,2.1915733019510903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.01,0.0770687997341156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.01,0.2066943883895874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.01,0.07613440155982971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,balanced,0.9476799964904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.01,0.24348800182342528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,balanced,0.08115200201670329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.01,0.06935039758682252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.01,0.08307200074195861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.01,0.2649343967437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,balanced,0.08206399778525035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.01,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,balanced,3.4167467753092446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.01,0.21746559143066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,balanced,1.2459626992543538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.01,0.08188160061836243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.01,0.2963007926940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.01,0.08840320110321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.01,0.08963840007781983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.01,0.3347264051437378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.01,0.09262719750404358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,balanced,1.5553760528564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.01,0.09383040070533752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.01,0.48244481086730956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.01,0.09806079864501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.01,0.10189440250396728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.01,0.5371712207794189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,balanced,0.0848426620165507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.01,0.10349440574645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.01,0.7563776016235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.01,0.12161920070648194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,balanced,0.0862613320350647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.01,1.0553152084350585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.01,0.15615999698638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,balanced,2.4101866086324057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,balanced,6.469280242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,balanced,0.08875733613967896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.01,0.13833600282669067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.01,1.5374336242675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.01,0.16035200357437135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,balanced,0.08946667114893596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.01,2.392582321166992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.01,0.21388800144195558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.01,0.2234560012817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.01,2.987763214111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.01,0.3506367921829224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.01,0.41368961334228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.01,4.627481460571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,balanced,0.09969066580136617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.01,0.5541312217712402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,balanced,0.1011946698029836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.01,4.821420669555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.01,0.6990015983581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,balanced,0.10664000113805135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.01,0.9676095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,balanced,4.7243092854817705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.01,8.910431671142579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.01,1.5812800407409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,balanced,0.1328426698843638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.01,2.5737791061401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,balanced,0.1421119968096415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.01,2.9178815841674806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.01,18.0300537109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,balanced,0.19293334086736044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.01,4.01712646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,balanced,0.24336532751719156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.01,4.793401718139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.01,11.6840576171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,balanced,0.3599253495534261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,balanced,0.48775466283162433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,4,power_law_1.2,0.12200959920883178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,balanced,0.7566933631896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,4,power_law_1.2,0.10026880502700805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,balanced,0.9963573614756266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,4,power_law_1.2,0.09592959880828858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,power_law_1.01,0.0652288019657135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,4,power_law_1.2,0.12553600072860718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,power_law_1.01,0.06446080207824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,balanced,1.4817387262980144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,4,power_law_1.2,0.12537599802017213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,power_law_1.01,0.06926720142364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,4,power_law_1.2,0.13197439908981323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,power_law_1.01,0.0778880000114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,4,power_law_1.2,0.13537280559539794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,power_law_1.01,0.07912960052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,balanced,1.9676586786905925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,4,power_law_1.2,0.1382591962814331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,power_law_1.01,0.08449919819831848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,4,power_law_1.2,0.5808063983917237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,4,power_law_1.2,1.2423999786376954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,power_law_1.01,0.0917248010635376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,4,power_law_1.2,0.15786880254745483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,power_law_1.01,0.09600639939308167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,4,power_law_1.2,0.16933759450912475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,balanced,2.4413439432779946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,4,power_law_1.2,0.16307200193405152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,4,power_law_1.2,0.21568000316619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,4,power_law_1.2,0.26363520622253417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,power_law_1.01,0.10408960580825806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,4,power_law_1.2,0.32213759422302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,4,power_law_1.2,0.267737603187561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,power_law_1.01,0.1031872034072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,4,power_law_1.2,0.371616005897522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,balanced,3.8947626749674478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,4,power_law_1.2,0.3827264070510864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,4,power_law_1.2,0.5387199878692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,power_law_1.01,0.09429759979248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,4,power_law_1.2,0.6069952011108398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,power_law_1.01,0.10030080080032348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,4,power_law_1.2,0.8938176155090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,power_law_1.01,0.10707199573516846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,4,power_law_1.2,1.0796863555908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,power_law_1.01,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,4,power_law_1.2,1.3478912353515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,4,power_law_1.2,2.3340415954589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,power_law_1.01,0.12646399736404418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,4,power_law_1.2,3.502579116821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,4,power_law_1.2,0.08239359855651855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,power_law_1.01,0.13819520473480223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,4,power_law_1.2,0.07631360292434693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,balanced,7.73086420694987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,4,power_law_1.2,4.947449493408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,4,power_law_1.2,0.07470719814300537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,power_law_1.01,0.16692479848861694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,4,power_law_1.2,6.398643112182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,4,power_law_1.2,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,power_law_1.01,0.25991039276123046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,4,power_law_1.2,8.945785522460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,power_law_1.01,0.30605440139770507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,4,power_law_1.2,0.08339200019836426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,power_law_1.01,0.46197757720947263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,4,power_law_1.2,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,4,power_law_1.2,18.785215759277342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,4,power_law_1.2,0.093612802028656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,power_law_1.01,0.4743040084838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,4,power_law_1.2,0.09191679954528809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,power_law_1.01,0.7819647789001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,4,power_law_1.2,0.09247360229492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,4,power_law_1.2,0.09493759870529175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,power_law_1.01,1.200153636932373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,4,power_law_1.2,0.09962239861488342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,power_law_1.01,1.5416831970214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,4,power_law_1.2,0.10075520277023316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,power_law_1.01,2.64147834777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,4,power_law_1.2,0.10145280361175538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,4,power_law_1.2,0.13439359664916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,power_law_1.01,2.6188543319702147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,4,power_law_1.2,0.1304128050804138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,power_law_1.01,6.3175102233886715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,4,power_law_1.2,0.16687359809875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,4,power_law_1.2,0.16371840238571167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,power_law_1.01,5.77957763671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,4,power_law_1.2,0.2177664041519165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,4,power_law_1.2,0.2355583906173706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,4,power_law_1.2,0.07668480277061462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,power_law_1.01,10.472243499755859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,4,power_law_1.2,0.3583231925964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,4,power_law_1.2,0.06373119950294495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,4,power_law_1.2,0.4110591888427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,4,power_law_1.2,0.0691968023777008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,4,power_law_1.2,0.6588479995727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,power_law_1.01,23.692576599121093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,4,power_law_1.2,0.07742080092430115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,4,power_law_1.2,0.7438079833984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,4,power_law_1.2,0.07775359749794006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,4,power_law_1.2,1.0110272407531737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,4,power_law_1.2,0.08775039911270141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,4,power_law_1.2,1.534982395172119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,4,power_law_1.2,0.09304320216178893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,4,power_law_1.2,2.420217514038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,4,power_law_1.2,0.10119040012359619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,4,power_law_1.2,3.070783996582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,4,power_law_1.2,4.211404800415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,4,power_law_1.2,0.092467200756073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,balanced,0.0413973331451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,balanced,0.05829333265622457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,4,power_law_1.2,0.10092159509658813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,4,power_law_1.2,4.694591903686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,balanced,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,balanced,0.05638400216897329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,balanced,0.12594667077064514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,balanced,0.07899733384450276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,balanced,0.1290186643600464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,4,power_law_1.2,11.370336151123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,balanced,0.1252906620502472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,4,power_law_1.2,0.09736319780349731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,balanced,0.08238400022188823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,balanced,0.12652800480524698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,4,power_law_1.2,0.10252159833908081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,balanced,0.08321600159009297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,balanced,0.127402663230896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,4,power_law_1.2,0.11075199842453003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,balanced,0.1328000028928121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,balanced,0.08441600203514099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,balanced,0.1329813301563263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,4,power_law_1.2,0.12887680530548096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,balanced,0.13354133566220602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,balanced,0.08572799960772197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,balanced,0.13843733072280884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,balanced,0.03598399957021078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,balanced,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,4,power_law_1.2,0.12804479598999025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,balanced,0.1373973290125529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,balanced,0.13888532916704813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,balanced,0.049456000328063965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,balanced,0.0869599978129069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,4,power_law_1.2,0.1457856059074402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,balanced,0.1450506647427877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,balanced,0.07348266740640004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,balanced,0.08784000078837077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,balanced,0.15275200208028158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,4,power_law_1.2,0.20330240726470947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,balanced,0.15355733036994934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,balanced,0.07708266874154408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,balanced,0.09134399890899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,4,power_law_1.2,0.23771519660949708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,balanced,0.16394666830698648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,balanced,0.0768746683994929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,4,power_law_1.2,0.314572811126709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,balanced,0.09144000212351482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,balanced,0.18522665898005167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,balanced,0.07885866860548656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,balanced,0.24149866898854574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,4,power_law_1.2,0.44885759353637694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,balanced,0.09473066528638203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,balanced,0.08061866462230682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,balanced,0.32283200820287067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,balanced,0.09518933296203613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,4,power_law_1.2,0.6928192138671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,balanced,0.0799786647160848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,balanced,0.27450132369995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,balanced,0.10943466424942017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,balanced,0.39922666549682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,4,power_law_1.2,1.0829119682312012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,balanced,0.11016000310579936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,balanced,0.5056693156560262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,balanced,0.1164959967136383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,4,power_law_1.2,1.1600128173828126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,balanced,0.13084800044695535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,4,power_law_1.2,1.7608896255493165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,balanced,0.7420639991760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,balanced,0.08242666721343994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,balanced,0.14882133404413858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,4,power_law_1.2,2.406329536437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,balanced,0.08347200353940327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,balanced,0.9706613222757975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,balanced,0.2021226684252421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,4,power_law_1.2,4.54400634765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,balanced,0.21473600467046103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,balanced,1.4144479433695476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,4,power_law_1.2,4.316185760498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,balanced,0.3044533332188924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,4,power_law_1.2,7.807218933105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,balanced,1.8936479886372883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,balanced,0.38492266337076825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,balanced,0.08635733524958293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,4,power_law_1.2,13.295820617675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,balanced,0.5523413419723511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.01,0.08289920091629029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,balanced,0.08898133039474487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,balanced,2.3587519327799478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.01,0.07957119941711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,balanced,0.0913813312848409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,balanced,0.7199359734853109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.01,0.09476479887962341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,4,power_law_1.2,23.814515686035158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,balanced,0.09373866518338521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.01,0.12836480140686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.01,0.12478079795837402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.01,0.12663040161132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,balanced,1.0595520337422688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.01,0.13096319437026976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,balanced,3.611728032430013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,balanced,0.10626666744550069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.01,0.1388479948043823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,balanced,0.1088693340619405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.01,0.1392192006111145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,balanced,1.3751999537150066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.01,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.01,0.13941760063171388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,balanced,0.11664000153541565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.01,0.14361599683761597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.01,0.05304960012435913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,balanced,0.149509330590566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.01,0.14863359928131104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.01,0.057920002937316896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,balanced,0.16245333353678384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.01,0.15217920541763305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,balanced,1.6983146667480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.01,0.16687359809875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.01,0.08095359802246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.01,0.19679360389709472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.01,0.08286719918251037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.01,0.19701759815216063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,balanced,7.164805094401042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.01,0.0850495994091034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.01,0.1999168038368225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,balanced,0.2286346753438314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.01,0.08748800158500672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.01,0.23189759254455566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,balanced,2.6193493207295737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.01,0.08747519850730896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.01,0.25630080699920654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,balanced,0.3033173282941182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.01,0.08565120100975036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.01,0.3951936006546021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.01,0.09007359743118286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,balanced,0.45138665040334064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.01,0.43242878913879396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.01,0.0995136022567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.01,0.6315264225006103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.01,0.09649279713630676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,balanced,0.5962453285853068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.01,0.7788991928100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.01,0.10219520330429077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.01,1.1643903732299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,balanced,0.8966293334960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.01,0.11249920129776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.01,1.5338687896728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.01,0.12297600507736206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,balanced,5.219776153564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.01,0.13338880538940429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,balanced,1.1856853167215984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.01,1.815225601196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.01,0.13123199939727784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.01,2.8159231185913085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.01,0.17115520238876342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,balanced,1.7620372772216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.01,3.527462387084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.01,0.19883519411087036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,power_law_1.01,0.04672000110149384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.01,0.2652224063873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.01,5.180441665649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.01,0.3033279895782471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,power_law_1.01,0.05514879822731018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,balanced,2.3373066584269204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.01,0.3896320104598999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.01,9.546329498291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,power_law_1.01,0.07772160172462464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.01,0.5557375907897949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,power_law_1.01,0.07831680178642272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,2,power_law_1.2,0.08214399814605713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.01,0.7260608196258544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,power_law_1.01,0.08353279829025269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,balanced,2.923957188924154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,power_law_1.01,0.0870527982711792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.01,1.0792384147644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,2,power_law_1.2,0.09050880074501037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,power_law_1.01,0.09214079976081849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.01,1.5784832000732423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,2,power_law_1.2,0.0847104012966156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.01,2.0171199798583985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,2,power_law_1.2,0.128057599067688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,power_law_1.01,0.09419519901275634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,2,power_law_1.2,0.12511999607086183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.01,2.712384033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,balanced,4.701381365458171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,power_law_1.01,0.09570559859275818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,2,power_law_1.2,0.12286720275878907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.01,3.8388160705566405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,2,power_law_1.2,0.13194880485534669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,2,power_law_1.2,0.14080640077590942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.01,8.161055755615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,power_law_1.01,0.09941120147705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,2,power_law_1.2,0.14085760116577148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,power_law_1.01,0.10170880556106568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,2,power_law_1.2,0.14568959474563598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,power_law_1.01,0.10570240020751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,power_law_1.01,0.11881599426269532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,2,power_law_1.2,0.14407680034637452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,2,power_law_1.2,0.1516543984413147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,power_law_1.01,0.1287551999092102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,2,power_law_1.2,0.14982399940490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,balanced,9.404778798421225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,power_law_1.01,0.13184640407562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,power_law_1.01,0.16195199489593506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,2,power_law_1.2,0.17388800382614136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,power_law_1.01,0.192467200756073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,2,power_law_1.2,0.18551039695739746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,power_law_1.01,0.28879361152648925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,2,power_law_1.2,0.1894271969795227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,power_law_1.01,0.3505728006362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,2,power_law_1.2,0.20305280685424804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,power_law_1.01,0.44785919189453127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,2,power_law_1.2,0.2594239950180054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,power_law_1.01,0.7544511795043946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,2,power_law_1.2,0.30687999725341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,power_law_1.01,0.9356863975524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,2,power_law_1.2,0.41452798843383787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,power_law_1.01,1.4041343688964845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,2,power_law_1.2,0.4108799934387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,power_law_1.01,2.020908737182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,2,power_law_1.2,0.6214911937713623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,power_law_1.01,2.4483455657958983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,2,power_law_1.2,0.8099776268005371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,power_law_1.01,3.5121150970458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,2,power_law_1.2,1.3646400451660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,power_law_1.01,4.653062438964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,2,power_law_1.2,1.5385855674743651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,power_law_1.01,7.791155242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,2,power_law_1.2,2.4662912368774412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,2,power_law_1.2,3.0686336517333985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,power_law_1.01,15.83846435546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,2,power_law_1.2,3.6032894134521483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,2,power_law_1.2,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,2,power_law_1.2,5.867264175415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,2,power_law_1.2,0.06079999804496765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,2,power_law_1.2,11.737049865722657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,2,power_law_1.2,0.05912960171699524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,2,power_law_1.2,0.08024320006370544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,2,power_law_1.2,0.08272640109062195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,2,power_law_1.2,0.08529279828071594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,2,power_law_1.2,0.08661760091781616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,2,power_law_1.2,0.08697599768638611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,2,power_law_1.2,0.09218559861183166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,2,power_law_1.2,0.09022079706192017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,2,power_law_1.2,0.09838719964027405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,2,power_law_1.2,0.10058879852294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,2,power_law_1.2,0.09994239807128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,2,power_law_1.2,0.11350400447845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,2,power_law_1.2,0.12439680099487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,2,power_law_1.2,0.1311360001564026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,2,power_law_1.2,0.1511615991592407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,2,power_law_1.2,0.05375999808311462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,2,power_law_1.2,0.16990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,2,power_law_1.2,0.20618879795074463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,2,power_law_1.2,0.05240319967269898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,2,power_law_1.2,0.27559680938720704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,2,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,2,power_law_1.2,0.29134719371795653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,balanced,0.0581279993057251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,2,power_law_1.2,0.07434880137443542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,2,power_law_1.2,0.4651328086853027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,2,power_law_1.2,0.5102719783782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,2,power_law_1.2,0.07784960269927979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,balanced,0.08084799846013387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,2,power_law_1.2,0.7320384025573731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,2,power_law_1.2,0.08425599932670594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,2,power_law_1.2,1.138803195953369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,balanced,0.12664533654848734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,2,power_law_1.2,0.08638719916343689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,2,power_law_1.2,1.5889023780822753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,2,power_law_1.2,0.08632959723472595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,balanced,0.12442666292190552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,2,power_law_1.2,2.0365375518798827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,balanced,0.12523733576138815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,2,power_law_1.2,2.906809616088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,balanced,0.12600533167521158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,2,power_law_1.2,0.09150720238685608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,2,power_law_1.2,4.145779037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,balanced,0.04049066702524821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,balanced,0.12719999750455221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,2,power_law_1.2,0.09644799828529357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,2,power_law_1.2,7.196889495849609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,balanced,0.12894933422406515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,balanced,0.05635733405749003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,balanced,0.13082666198412576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,balanced,0.07938133180141449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,2,power_law_1.2,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,balanced,0.13172800342241922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,balanced,0.08309866487979889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,2,power_law_1.2,0.09986559748649597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,balanced,0.08332266906897227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,balanced,0.1387999951839447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,2,power_law_1.2,0.10814720392227173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,balanced,0.0846720039844513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,balanced,0.14018133282661438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,2,power_law_1.2,0.11111040115356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,balanced,0.14230400323867798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,balanced,0.08638933300971985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,2,power_law_1.2,0.13262720108032228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,balanced,0.1525173286596934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,balanced,0.08603200316429138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,2,power_law_1.2,0.1408128023147583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,balanced,0.15665599703788757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,2,power_law_1.2,0.15560959577560424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,balanced,0.08737066388130188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,balanced,0.15957333644231161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,2,power_law_1.2,0.2019200086593628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,balanced,0.08916800220807393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,2,power_law_1.2,0.2629568099975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,balanced,0.17055465777715048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,balanced,0.09063466389973958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,balanced,0.19527467091878256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.057043200731277464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,balanced,0.09454400340716045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,2,power_law_1.2,0.39692161083221433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,balanced,0.21520533164342245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,balanced,0.09703466296195984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,balanced,0.037263999382654824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,2,power_law_1.2,0.5314752101898194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.0749888002872467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,balanced,0.10101866722106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,balanced,0.28678399324417114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,balanced,0.05136000116666158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,2,power_law_1.2,0.6932223796844482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,balanced,0.11081066727638245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.11980799436569214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,balanced,0.37650132179260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,balanced,0.07446933289368947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,2,power_law_1.2,1.038764762878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.1198848009109497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,2,power_law_1.2,1.4438207626342774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,balanced,0.510810653368632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,balanced,0.11205333471298218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.12692480087280272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,balanced,0.07814933359622955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,2,power_law_1.2,2.0593664169311525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.1324928045272827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,balanced,0.5965386629104614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,balanced,0.07876266539096832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,balanced,0.12793599565823874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.13335039615631103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,2,power_law_1.2,2.7899648666381838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,balanced,0.08102933565775554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,balanced,0.8856906890869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.764902400970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,balanced,0.1460853318373362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,balanced,0.08341866731643677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,2,power_law_1.2,3.605440139770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.9757439613342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,balanced,0.0839359958966573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,balanced,0.15893866618474325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,2,power_law_1.2,4.577920150756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,balanced,1.140005350112915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.14872959852218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,balanced,0.22452799479166666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.15091840028762818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,2,power_law_1.2,8.358092498779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,balanced,0.27079999446868896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.14910080432891845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,balanced,1.6911892890930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,balanced,0.3880586624145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.17267199754714965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,2,power_law_1.2,15.905548095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,balanced,0.08660800258318584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.1819584012031555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,balanced,0.4726346731185913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,balanced,2.2308425903320312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,balanced,0.08860266208648682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.1783360004425049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.04169600009918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,balanced,0.6979093551635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.25055360794067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.25722880363464357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,balanced,2.8076534271240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.08020480275154114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,balanced,0.8923199971516927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.08107519745826722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.33466880321502684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,power_law_1.01,0.039059200882911684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.0892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.37893118858337405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.08764799833297729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,balanced,1.2960373560587566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,power_law_1.01,0.04570240080356598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.08906880021095276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.5263679981231689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,balanced,0.09404800335566203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.01,0.6658368110656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,power_law_1.01,0.05490559935569763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,balanced,4.13316281636556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.09247999787330627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,balanced,0.09768533706665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.01,0.9397248268127442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.09668480157852173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,balanced,1.7406293551127117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,power_law_1.01,0.07811200022697448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,balanced,0.10199466347694397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.10001280307769775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.01,1.1708928108215333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,power_law_1.01,0.0785152018070221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.10229120254516602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,balanced,0.10729066530863444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.11486719846725464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.01,1.650227165222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,power_law_1.01,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,balanced,0.12112533052762349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.12188160419464111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,power_law_1.01,0.08652799725532531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.01,2.308639907836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,balanced,0.12572800119717917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,balanced,2.192037264506022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.12416640520095826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.01,2.8634687423706056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,balanced,0.13794133067131042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,power_law_1.01,0.08950399756431579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.13037439584732055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.1664896011352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,balanced,0.18629332383473715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.01,4.080659103393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.18078080415725709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,balanced,0.22428266207377115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,balanced,8.139269510904947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.2447808027267456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.01,7.967955017089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,balanced,0.3249066670735677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,power_law_1.01,0.09444479942321778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.40416641235351564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,balanced,3.3331305185953775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,balanced,0.4251146713892619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,power_law_1.01,0.09807999730110169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,0.5043456077575683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,0.7065919876098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,balanced,0.6258773406346639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,0.9042431831359863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,power_law_1.01,0.10304000377655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,1.3255295753479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,balanced,0.8269866307576498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,1.7572351455688477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,power_law_1.01,0.10500479936599731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,balanced,1.2398933569590251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.01,2.1997440338134764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,power_law_1.01,0.10913280248641968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.01,3.2413822174072267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,power_law_1.01,0.11887359619140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,balanced,1.640325387318929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,power_law_1.01,0.13683199882507324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.01,6.4219970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,power_law_1.01,0.14431359767913818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,balanced,6.827599843343099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,power_law_1.01,0.15604480504989623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,balanced,2.4431306521097818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,power_law_1.01,0.20430080890655516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.01,0.2547327995300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.056979197263717654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,balanced,3.244762738545736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.06303359866142273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.01,0.3600703954696655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.07467520236968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.01,0.45822720527648925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.12357759475708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.01,0.6668735980987549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,balanced,4.039807955423991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.12532479763031007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.01,0.8696127891540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.12723840475082399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.01,1.2844479560852051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.13154560327529907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.1345088005065918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.01,1.686502456665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.9784064292907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,balanced,6.4347788492838545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.01,2.4854080200195314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.9749631881713867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.01,3.3031936645507813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.14837119579315186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.15017600059509278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.01,4.116134262084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.1498047947883606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,power_law_1.01,6.503826904296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.17158399820327758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.17834880352020263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,power_law_1.01,12.945420837402343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.1780992031097412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.23171839714050294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,balanced,12.921119689941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.24714879989624022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.25564160346984866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.3330048084259033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.37792000770568845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.5131840229034423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,1,power_law_1.2,0.6728576183319092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,1,power_law_1.2,0.9341695785522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,1,power_law_1.2,1.1353216171264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,1,power_law_1.2,1.6563264846801757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,1,power_law_1.2,2.2908863067626952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,1,power_law_1.2,2.874496078491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,1,power_law_1.2,4.108006286621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.04217599928379059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.04965119957923889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,1,power_law_1.2,7.9735870361328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.05375360250473023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.08061439990997314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.0834496021270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.0886847972869873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.08872960209846496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.0899392008781433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.0937279999256134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.09144319891929627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.09717119932174682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.10135040283203126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.10173439979553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.11479040384292602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.12284799814224243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.12679680585861205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,1,power_law_1.2,0.039904001355171206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.133024001121521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.1742784023284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,1,power_law_1.2,0.04665600061416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,1,power_law_1.2,0.053472000360488894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.18264960050582885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,1,power_law_1.2,0.07527679800987244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.2420032024383545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,1,power_law_1.2,0.07724159955978394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.295743989944458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,1,power_law_1.2,0.08648319840431214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.4096384048461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,1,power_law_1.2,0.08666880130767822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,1,power_law_1.2,0.09032319784164429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,0.5101439952850342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,0.7085696220397949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,0.9087103843688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,1,power_law_1.2,0.09132159948348999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,1.3322239875793458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,1.7670400619506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,1,power_law_1.2,0.09502080082893372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,1,power_law_1.2,2.20578556060791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,1,power_law_1.2,3.2591678619384767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,1,power_law_1.2,0.10561280250549317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,1,power_law_1.2,6.450374603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,1,power_law_1.2,0.10766719579696656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,1,power_law_1.2,0.11090559959411621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,1,power_law_1.2,0.11683199405670167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,balanced,0.08741866548856099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,1,power_law_1.2,0.13649280071258546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,balanced,0.0832426647345225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,1,power_law_1.2,0.14147839546203614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,1,power_law_1.2,0.15772160291671752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,balanced,0.10205866893132527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,1,power_law_1.2,0.20700159072875976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,balanced,0.15588800112406412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.2,0.2548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,balanced,0.27641600370407104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.2,0.35824639797210694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.2,0.456601619720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,balanced,0.49878398577372235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.2,0.6572991847991944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,balanced,0.5003626743952433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,balanced,0.06228800117969513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.2,0.8585920333862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.2,1.2740991592407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,balanced,0.4983573357264201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,balanced,0.06376533210277557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.2,1.6591999053955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,balanced,0.07226666808128357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,balanced,0.4993120034535726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.2,2.4624959945678713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,balanced,0.10331733028093974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,balanced,0.4988906780878703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.2,3.25494384765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,balanced,0.16197866201400757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,balanced,0.4952746629714966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,balanced,0.274944007396698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.2,4.064608001708985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,balanced,0.27794132630030316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,balanced,0.4980586767196655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,1,power_law_1.2,6.454688262939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,balanced,0.2775999903678894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,balanced,0.4983893235524495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,balanced,0.2788640062014262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,1,power_law_1.2,12.765856170654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,balanced,0.5001813173294067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,balanced,0.2791573405265808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,balanced,0.5068213144938151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,balanced,0.2831679979960124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,balanced,0.28405332565307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,balanced,0.5104586680730184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,balanced,0.2876480023066203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,balanced,0.5150453249613444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,balanced,0.2906240026156108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,balanced,0.5377600193023682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,balanced,0.29787200689315796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,balanced,0.05797333518664042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,balanced,0.5550826787948608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,balanced,0.3004960020383199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,balanced,0.05514133473237356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,balanced,0.3086079955101013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,balanced,0.5725119908650717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,balanced,0.07518933216730754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,balanced,0.32259732484817505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,balanced,0.10134399930636089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,balanced,0.615285317103068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,balanced,0.3371359904607137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,balanced,0.17916266123453775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,balanced,0.2691253423690796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,balanced,0.6392106612523397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,balanced,0.3606026570002238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,balanced,0.2722880045572917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,balanced,0.27190399169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,balanced,0.39652268091837567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,balanced,0.27436800797780353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,balanced,0.676362673441569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,balanced,0.2749920090039571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.01,0.2907263994216919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,balanced,0.27772267659505206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.01,0.176256000995636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,balanced,0.4386560122172038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.01,0.4978303909301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,balanced,0.2799253265062968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.01,0.275603199005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.01,0.20047359466552733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,balanced,0.8145600159962972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,balanced,0.28245866298675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.01,0.1348736047744751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.01,0.17277439832687377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,balanced,0.49161601066589355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,balanced,0.2847839991251628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.01,0.2665600061416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.01,0.11982719898223877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.01,0.3340480089187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,balanced,0.2946559985478719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.01,0.16469759941101075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.01,0.4271423816680908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,balanced,0.29627732435862225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,balanced,0.6168959935506185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.01,0.174726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.01,0.40824317932128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,balanced,0.8976106643676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,balanced,0.3046986659367879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.01,0.4159103870391846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.01,0.24147839546203614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.01,0.4380928039550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.01,0.23534080982208253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.01,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.01,0.2603456020355225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.01,0.44186878204345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,balanced,0.724565347035726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.01,0.2533567905426025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.01,0.4345344066619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.01,0.2525504112243652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,balanced,0.3216800093650818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.01,0.48375678062438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,balanced,1.1797866821289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.01,0.25208320617675783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.01,0.47377920150756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.01,0.26791679859161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.01,0.5227968215942382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.01,0.27175040245056153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.01,0.5374335765838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,power_law_1.01,0.1838655948638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.01,0.2967168092727661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,balanced,0.994383970896403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.01,0.5990528106689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,power_law_1.01,0.27515521049499514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.01,0.2957247972488403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.01,0.5938623905181885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,power_law_1.01,0.09132800102233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.01,0.30108160972595216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.01,0.7177663803100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,balanced,0.34379732608795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,power_law_1.01,0.12273279428482056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.01,0.3444159984588623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.01,0.6937407970428466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,balanced,1.4348799387613933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,power_law_1.01,0.15695359706878662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.01,0.36528639793395995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.01,0.8622719764709472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,balanced,0.37248531977335614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,power_law_1.01,0.20263679027557374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.01,0.4435840129852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.01,0.8997247695922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,power_law_1.01,0.23011200428009032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.01,0.448851203918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,balanced,0.3986026843388875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.01,1.2313728332519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,balanced,1.2563626766204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.01,0.5416959762573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,power_law_1.01,0.24297599792480468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.01,1.5249088287353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,power_law_1.01,0.24697599411010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.01,0.6460864067077636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,balanced,0.46688000361124676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.01,2.0639999389648436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,power_law_1.01,0.23335680961608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.01,0.8600959777832031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,power_law_1.01,0.26407680511474607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.01,2.727622413635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.01,1.0434304237365724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,power_law_1.01,0.28197760581970216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,balanced,0.5324693520863851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,power_law_1.01,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.01,1.4973504066467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.01,3.6628543853759767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,power_law_1.01,0.28825600147247316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,balanced,1.7327307065327961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.01,1.9509952545166016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.01,5.159308624267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,power_law_1.01,0.3101759910583496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,balanced,0.7403466701507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.01,2.470342445373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,power_law_1.01,0.33115520477294924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,power_law_1.01,0.39598081111907957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,balanced,1.5363306999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.01,10.420480346679687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.01,4.1219135284423825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,power_law_1.01,0.38611199855804446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.01,7.6868034362792965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,balanced,0.8612053394317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.01,0.3856512069702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.01,0.4734975814819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.01,0.5726528167724609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,balanced,1.2649226983388264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.01,0.6922239780426025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.01,0.9172543525695801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,balanced,2.6779839197794595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.01,1.3319487571716309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.01,1.5348799705505372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,16,power_law_1.2,0.2875456094741821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,balanced,2.3437439600626626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.01,2.4464448928833007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,16,power_law_1.2,0.46472320556640623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.01,3.273964691162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,16,power_law_1.2,0.14477440118789672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,balanced,1.6609387397766113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,power_law_1.01,4.089369583129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,16,power_law_1.2,0.2012928009033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,16,power_law_1.2,0.26905601024627684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.01,6.103590393066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,16,power_law_1.2,0.2677695989608765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,16,power_law_1.2,0.38587520122528074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,16,power_law_1.2,0.42535037994384767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.01,15.134086608886719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,16,power_law_1.2,0.43109760284423826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,16,power_law_1.2,0.405401611328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,16,power_law_1.2,0.4494272232055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.17461760044097902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,16,power_law_1.2,0.47234559059143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,balanced,2.06988795598348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,16,power_law_1.2,0.25470719337463377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,16,power_law_1.2,0.47057280540466306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,16,power_law_1.2,0.5052735805511475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.09099519848823548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,16,power_law_1.2,0.11212799549102784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,16,power_law_1.2,0.5053631782531738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,16,power_law_1.2,0.14321919679641723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,16,power_law_1.2,0.5337215900421143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.17866239547729493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,16,power_law_1.2,0.528991985321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.2335103988647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.24067199230194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,16,power_law_1.2,0.6579455852508544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.22654080390930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,16,power_law_1.2,0.669055986404419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,16,power_law_1.2,0.22858240604400634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,16,power_law_1.2,0.7706880092620849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.25253119468688967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,16,power_law_1.2,0.7704192161560058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.27387518882751466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,16,power_law_1.2,1.037484836578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.2731328010559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,balanced,5.297594706217448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,16,power_law_1.2,1.0072128295898437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.27665278911590574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,16,power_law_1.2,1.3939647674560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,balanced,4.548437436421712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,balanced,3.277157465616862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.30707199573516847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,16,power_law_1.2,1.7590848922729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,16,power_law_1.2,0.2975231885910034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,16,power_law_1.2,3.247488021850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,16,power_law_1.2,0.3222208023071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,16,power_law_1.2,3.4075649261474608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,16,power_law_1.2,0.3711616039276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,16,power_law_1.2,4.29791374206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,0.3916800022125244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,16,power_law_1.2,6.4661308288574215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,0.4793856143951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,0.4795072078704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,16,power_law_1.2,16.989561462402342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,0.6125247955322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,0.734003210067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,0.934547233581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,1.3064576148986817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,1.8814464569091798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,2.4637184143066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,16,power_law_1.2,3.3226943969726563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,16,power_law_1.2,4.541888046264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,16,power_law_1.2,9.392441558837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,balanced,6.678469340006511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,balanced,0.06887466708819072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,balanced,0.0713866651058197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,balanced,0.09850133458773296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,balanced,0.1562879979610443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,balanced,0.26710400978724164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,balanced,0.49688533941904706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,16,power_law_1.2,0.16647039651870726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,balanced,0.49853332837422687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,balanced,0.4989226659138997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,16,power_law_1.2,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,balanced,0.5007573366165161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,16,power_law_1.2,0.08909440040588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,balanced,0.5044960180918375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,16,power_law_1.2,0.11692160367965698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,balanced,0.4984746774037679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,16,power_law_1.2,0.1363968014717102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,balanced,0.5012533267339071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,balanced,0.5024799903233846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,16,power_law_1.2,0.15242880582809448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,balanced,0.5065706570943197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,16,power_law_1.2,0.23899519443511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,balanced,0.5134880145390829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,16,power_law_1.2,0.23443200588226318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,16,power_law_1.2,0.23821439743041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,balanced,0.5170240004857382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,16,power_law_1.2,0.2444927930831909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,balanced,0.5269226630528768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,16,power_law_1.2,0.257094407081604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,balanced,0.5512746572494507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,16,power_law_1.2,0.2819839954376221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,balanced,0.5710826714833578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,16,power_law_1.2,0.2809920072555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,balanced,0.5919466813405355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,16,power_law_1.2,0.2822144031524658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,balanced,0.6375893354415894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,16,power_law_1.2,0.3274431943893433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,balanced,0.05218133330345154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,16,power_law_1.2,0.36579840183258056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,balanced,0.6850186983744303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,balanced,0.0555626650651296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,16,power_law_1.2,0.4069056034088135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,balanced,0.07152533531188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,balanced,0.10377599795659383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,balanced,0.735157330830892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,balanced,0.16168000300725302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,16,power_law_1.2,0.4440000057220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,balanced,0.2763520081837972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,balanced,0.2778826753298442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,balanced,0.2786080042521159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,balanced,0.8865813414255778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,balanced,0.2805013259251912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.2,0.4063744068145752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,balanced,0.2817866603533427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,balanced,0.2848320007324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.2,0.5696320056915283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,balanced,0.2861386736234029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.2,0.680787181854248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,balanced,0.2903520067532857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,balanced,0.9807306925455729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.2,0.8017024040222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,balanced,0.2940586606661479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,balanced,0.30430932839711505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.2,1.0542592048645019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,balanced,0.3062240084012349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.2,1.3839424133300782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,balanced,0.3147733410199483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.2,2.317241668701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,balanced,0.3297226627667745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.2,3.309280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,balanced,1.2952053546905518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.01,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,balanced,0.3470613161722819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.2,4.259545516967774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.01,0.2645695924758911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,balanced,0.3868853251139323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.01,0.1514623999595642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,16,power_law_1.2,5.113587188720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,balanced,0.41811199982961017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.01,0.17119359970092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.01,0.2231935977935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.2,8.569171142578124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,balanced,0.4776266813278198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.01,0.28219521045684814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,balanced,0.04977599779764811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.01,0.10860799551010132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,balanced,1.62173859278361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.01,0.38276479244232176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,balanced,0.05755733450253805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.2,17.79956512451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.01,0.15569280385971068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,balanced,0.5425013303756714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,balanced,0.07646933197975159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.01,0.39380478858947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.01,0.10905599594116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,balanced,0.11412800351778667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.01,0.41276798248291013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.01,0.10528000593185424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,balanced,0.18054932355880737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.01,0.41000962257385254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.01,0.13452160358428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,balanced,0.2718293269475301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,balanced,0.6892533302307129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.01,0.43482241630554197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,balanced,0.27525333563486737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.01,0.16996480226516725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.01,0.44858241081237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,balanced,0.27667733033498126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.01,0.21100161075592042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,balanced,0.2782133420308431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.01,0.44208641052246095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.01,0.2212224006652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,balanced,1.9868426322937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,balanced,0.27957866589228314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,balanced,0.8124852975209554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.01,0.4733312129974365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.01,0.23441920280456544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,balanced,0.28332799673080444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.01,0.4847360134124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.01,0.23138558864593506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,balanced,0.2860373258590698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.01,0.5027967929840088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.01,0.25077118873596194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,balanced,0.2899199922879537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.01,0.24928638935089112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.01,0.487443208694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,balanced,0.2937493324279785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.01,0.25769600868225095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.01,0.5753215789794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,balanced,0.30533866087595624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,balanced,1.1173280080159504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.01,0.27039361000061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.01,0.5833727836608886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,balanced,0.3088480035463969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.01,0.686732816696167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.01,0.28063359260559084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,balanced,0.32068800926208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,power_law_1.01,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.01,0.30316159725189207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.01,0.6444672107696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.01,0.3093760013580322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,power_law_1.01,0.16648319959640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.01,0.8290111541748046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,power_law_1.01,0.0882752001285553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,8,power_law_1.2,0.17493120431900025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.01,0.3455424070358276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.01,0.873862361907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,power_law_1.01,0.11619839668273926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.01,0.3755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,8,power_law_1.2,0.23836159706115723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.01,1.2022975921630858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,power_law_1.01,0.14394240379333495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,balanced,0.3435680071512858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,balanced,3.050352096557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,balanced,1.4340052604675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,8,power_law_1.2,0.11383680105209351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.01,0.4296127796173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.01,1.4434816360473632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,power_law_1.01,0.17815040349960326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,8,power_law_1.2,0.13671679496765138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.01,0.4525760173797607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,power_law_1.01,0.2241215944290161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.01,2.149235153198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,8,power_law_1.2,0.20703999996185302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.01,0.5496831893920898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,power_law_1.01,0.2259648084640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.01,2.5070016860961912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,8,power_law_1.2,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.01,0.6253888130187988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,power_law_1.01,0.2321023941040039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,8,power_law_1.2,0.34688639640808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.01,3.4038272857666017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.01,0.8757760047912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,power_law_1.01,0.2465536117553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,8,power_law_1.2,0.36805119514465334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,8,power_law_1.2,0.40108799934387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,balanced,0.3702133496602376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,power_law_1.01,0.25798399448394777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.01,1.062828826904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.01,4.685184097290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,8,power_law_1.2,0.41550722122192385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,power_law_1.01,0.2678272008895874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.01,1.4811327934265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,balanced,0.41940800348917645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,8,power_law_1.2,0.4248640060424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,power_law_1.01,0.2647167921066284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.01,8.859161376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,balanced,1.786138693491618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.01,1.8075008392333984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,8,power_law_1.2,0.4373824119567871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,power_law_1.01,0.29763839244842527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,balanced,0.4684213399887085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,8,power_law_1.2,0.4400832176208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.01,2.2590143203735353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,power_law_1.01,0.31308159828186033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,8,power_law_1.2,0.452953577041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,power_law_1.01,0.3303679943084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,balanced,0.5775466759999593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.01,3.727436828613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,8,power_law_1.2,0.5123839855194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,power_law_1.01,0.3737472057342529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,8,power_law_1.2,0.5140480041503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.01,7.001197052001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,8,power_law_1.2,0.5497983932495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,balanced,0.6658453146616617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,8,power_law_1.2,0.5910975933074951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,power_law_1.01,0.40790400505065916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,8,power_law_1.2,0.6572671890258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,8,power_law_1.2,0.7706304073333741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,balanced,0.9521173636118571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,8,power_law_1.2,0.7551104068756104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,power_law_1.01,0.40170879364013673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,8,power_law_1.2,0.8774463653564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,power_law_1.01,0.5090943813323975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,8,power_law_1.2,0.9766464233398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,power_law_1.01,0.6439104080200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,8,power_law_1.2,1.334943962097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,power_law_1.01,0.735487985610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,balanced,2.7513707478841147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,balanced,1.1420799891153972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,8,power_law_1.2,1.910540771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,power_law_1.01,0.9749504089355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,8,power_law_1.2,2.2704704284667967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,power_law_1.01,1.244358444213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,balanced,6.250138600667317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,8,power_law_1.2,3.181939125061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,power_law_1.01,1.8473087310791017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,8,power_law_1.2,3.704345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,power_law_1.01,2.359334373474121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,balanced,1.663845380147298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,8,power_law_1.2,6.363616180419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,power_law_1.01,3.363673782348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,power_law_1.01,3.75280647277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,8,power_law_1.2,13.342860412597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,power_law_1.01,6.6331329345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,power_law_1.01,12.353913879394531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,balanced,2.192570686340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,balanced,2.7276748021443686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,balanced,5.357205073038737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,8,power_law_1.2,0.10945279598236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,balanced,4.354906717936198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,8,power_law_1.2,0.1561728000640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,8,power_law_1.2,0.07303680181503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,8,power_law_1.2,0.10799360275268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,8,power_law_1.2,0.13270399570465088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,8,power_law_1.2,0.16303999423980714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,8,power_law_1.2,0.2121216058731079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,8,power_law_1.2,0.23648641109466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,8,power_law_1.2,0.22533760070800782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,8,power_law_1.2,0.23739519119262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,8,power_law_1.2,0.2574656009674072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,8,power_law_1.2,0.26501760482788084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,8,power_law_1.2,0.2770047903060913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,8,power_law_1.2,0.2844928026199341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,8,power_law_1.2,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,8,power_law_1.2,0.3158400058746338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,8,power_law_1.2,0.31548800468444826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,8,power_law_1.2,0.373088002204895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,8,power_law_1.2,0.4059904098510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,8,power_law_1.2,0.4742015838623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,8,power_law_1.2,0.48912639617919923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,8,power_law_1.2,0.576204776763916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,8,power_law_1.2,0.6970816135406495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,8,power_law_1.2,0.9263680458068848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,8,power_law_1.2,1.1797632217407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,balanced,8.688837051391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,8,power_law_1.2,0.11859840154647827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,8,power_law_1.2,1.8129152297973632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,8,power_law_1.2,0.1631999969482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,balanced,0.06311466793219249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,8,power_law_1.2,2.1677696228027346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,8,power_law_1.2,0.07868800163269044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,balanced,0.07186666627724965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,8,power_law_1.2,2.8795839309692384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,8,power_law_1.2,0.09998080134391785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,balanced,0.09937066833178203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,balanced,0.15983999768892923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,8,power_law_1.2,0.13575040102005004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,8,power_law_1.2,4.510540771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,8,power_law_1.2,0.16238080263137816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,balanced,0.2677599986394246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,balanced,0.5012960036595663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,8,power_law_1.2,0.2082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,8,power_law_1.2,9.560959625244141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,balanced,0.5027413368225098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,8,power_law_1.2,0.2296895980834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,balanced,0.5059413512547811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,8,power_law_1.2,0.24119679927825927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,balanced,0.5092213153839111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,8,power_law_1.2,0.24465279579162597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,balanced,0.5116320053736368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,8,power_law_1.2,0.26720640659332273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,balanced,0.5063199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,8,power_law_1.2,0.26206719875335693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,balanced,0.5068586667378744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,8,power_law_1.2,0.27582080364227296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,balanced,0.5141173203786215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,balanced,0.05063466727733612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,8,power_law_1.2,0.30076160430908205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,balanced,0.5203359921773275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,balanced,0.055914665261904396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,8,power_law_1.2,0.3262399911880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,balanced,0.07264000177383423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,balanced,0.5288213491439819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,balanced,0.10565867026646932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,8,power_law_1.2,0.33584640026092527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,balanced,0.5327253341674805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,balanced,0.16476800044377646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,balanced,0.2811200022697449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,8,power_law_1.2,0.4043327808380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,balanced,0.5421919822692871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,balanced,0.2831626733144124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,balanced,0.5695679982503256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,balanced,0.2850240071614583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,balanced,0.28595199187596637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,balanced,0.5978666543960571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,balanced,0.28782933950424194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,8,power_law_1.2,0.4361855983734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,balanced,0.29129600524902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,balanced,0.29555733998616535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,balanced,0.634773333867391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.01,0.10895359516143799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,balanced,0.298362672328949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,8,power_law_1.2,0.44931840896606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,balanced,0.6879200140635172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,balanced,0.30293333530426025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,8,power_law_1.2,0.5530496120452881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,balanced,0.31035733222961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.01,0.15267839431762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,balanced,0.3166453242301941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,8,power_law_1.2,0.6760000228881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,balanced,0.7661653359731039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.01,0.08462079763412475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,balanced,0.3276533285776774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,8,power_law_1.2,0.8603967666625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,balanced,0.3482453425725301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,8,power_law_1.2,1.0119808197021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.01,0.15155199766159058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,balanced,0.3866080045700073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,balanced,0.8538186550140381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,balanced,0.06018666426340739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,8,power_law_1.2,1.519430446624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.01,0.20364799499511718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,balanced,0.06881066660086314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,balanced,0.4328266779581706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,8,power_law_1.2,2.0249984741210936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,balanced,0.08355733752250671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.01,0.27720959186553956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,balanced,0.11921067039171855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,8,power_law_1.2,2.692198371887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,balanced,0.47065067291259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,balanced,1.035925308863322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,balanced,0.16979734102884927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.01,0.3701440095901489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,balanced,0.28793599208196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,8,power_law_1.2,3.436659240722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,balanced,0.2913386623064677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,balanced,0.5558826526006063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.01,0.39626240730285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,balanced,0.29285333553949994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,8,power_law_1.2,4.510982513427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.01,0.3791359901428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,balanced,0.295199990272522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,balanced,1.1980000336964924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.01,0.41202559471130373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,balanced,0.29772265752156574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,balanced,0.6478240092595419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,balanced,0.3012213309605916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,8,power_law_1.2,7.7472381591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.01,0.4260672092437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.01,0.07610880136489868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,balanced,0.30780800183614093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.01,0.4252927780151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,balanced,0.3110666672388713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.01,0.09960319995880126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,balanced,0.31943466265996295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.01,0.44658560752868653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,8,power_law_1.2,16.430514526367187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,balanced,0.8487839698791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,balanced,0.33486398061116535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.01,0.08565760254859925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.01,0.4712512016296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,balanced,0.3426133394241333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.01,0.4914559841156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,balanced,1.608890692392985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.01,0.10351359844207764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,balanced,0.35556264718373615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.01,0.4812863826751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.01,0.13621759414672852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.01,0.5080832004547119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,balanced,1.0432373682657878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.01,0.16460800170898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.01,0.5614336013793946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.01,0.22351360321044922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,balanced,0.39589866002400714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.01,0.609881591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.01,0.23576319217681885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.01,0.6918144226074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.01,0.23040640354156494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.01,0.7067967891693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,balanced,2.030186653137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,balanced,1.458661397298177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.01,0.8530879974365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.01,0.2298815965652466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.01,0.9235008239746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.01,0.2578495979309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,balanced,0.456767996152242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.01,0.2526592016220093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.01,1.2490431785583496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.01,0.26270079612731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.01,1.5042367935180665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,balanced,0.5439733266830444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.01,0.27241599559783936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.01,2.086150360107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,balanced,0.6190293232599894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.01,0.29431040287017823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.01,2.6181312561035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,balanced,1.8028799692789714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.01,0.30169599056243895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.01,3.400646209716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,balanced,0.797269344329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,balanced,2.485760052998861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.01,0.3209471940994263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.01,0.36368000507354736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.01,5.245420837402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.01,0.3799871921539307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,balanced,0.9491360187530518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.01,0.4424895763397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.01,10.141069030761718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.01,0.5090943813323975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.01,0.6321280002593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,balanced,1.3756106694539387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.01,0.7198912143707276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,balanced,2.2878293991088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.01,0.9491392135620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.01,1.203660774230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,balanced,1.6793440183003743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.01,1.6660863876342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.01,2.1065792083740233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,balanced,4.103610674540202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.01,2.749945640563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,balanced,2.48633607228597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.01,4.201932907104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,power_law_1.01,0.09137279987335205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.01,8.605120086669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,power_law_1.01,0.1161344051361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,power_law_1.01,0.0981760025024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,balanced,3.5097812016805015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,power_law_1.01,0.10181119441986083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,power_law_1.01,0.14636800289154053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,balanced,3.290074666341146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,4,power_law_1.2,0.10766719579696656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,power_law_1.01,0.17818880081176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,4,power_law_1.2,0.15789439678192138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,power_law_1.01,0.2258687973022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,4,power_law_1.2,0.08820480108261108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,power_law_1.01,0.23758718967437745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,4,power_law_1.2,0.13626879453659058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,power_law_1.01,0.2562688112258911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,4,power_law_1.2,0.17516160011291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,power_law_1.01,0.2549567937850952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,4,power_law_1.2,0.24427518844604493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,power_law_1.01,0.2627840042114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,4,power_law_1.2,0.36382079124450684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,power_law_1.01,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,balanced,4.099605242411296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,4,power_law_1.2,0.3793344020843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,power_law_1.01,0.28805758953094485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,power_law_1.01,0.3186367988586426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,4,power_law_1.2,0.40903677940368655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,power_law_1.01,0.33413760662078856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,4,power_law_1.2,0.41023998260498046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,power_law_1.01,0.3515199899673462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,4,power_law_1.2,0.4388415813446045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,power_law_1.01,0.3849152088165283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,4,power_law_1.2,0.46073598861694337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,4,power_law_1.2,0.4577343940734863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,power_law_1.01,0.45210881233215333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,balanced,8.137242635091146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,4,power_law_1.2,0.47542400360107423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,4,power_law_1.2,0.5003967761993409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,4,power_law_1.2,0.507596778869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,power_law_1.01,0.4818240165710449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,4,power_law_1.2,0.5440320014953614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,power_law_1.01,0.6126848220825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,power_law_1.01,0.7558207988739014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,4,power_law_1.2,0.599180793762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,balanced,6.545696258544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,power_law_1.01,0.9078847885131835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,4,power_law_1.2,0.6523136138916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,balanced,6.880399703979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,power_law_1.01,1.206726360321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,4,power_law_1.2,0.7393216133117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,power_law_1.01,1.6072256088256835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,4,power_law_1.2,0.753439998626709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,power_law_1.01,2.1482112884521483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,4,power_law_1.2,0.9099072456359864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,4,power_law_1.2,1.0579008102416991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,power_law_1.01,3.496531295776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,4,power_law_1.2,1.3226752281188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,power_law_1.01,4.181158447265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,4,power_law_1.2,1.6566656112670899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,power_law_1.01,5.079436874389648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,4,power_law_1.2,2.6430080413818358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,power_law_1.01,8.489574432373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,4,power_law_1.2,2.8678335189819335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,4,power_law_1.2,3.8576126098632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,4,power_law_1.2,0.07256320118904114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,power_law_1.01,16.17439422607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,4,power_law_1.2,5.724313735961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,4,power_law_1.2,0.09372159838676453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,4,power_law_1.2,0.06718720197677612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,4,power_law_1.2,11.876588439941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,4,power_law_1.2,0.09111040234565734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,4,power_law_1.2,0.12071039676666259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,4,power_law_1.2,0.1512511968612671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,4,power_law_1.2,0.20974719524383545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,4,power_law_1.2,0.21050879955291749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,4,power_law_1.2,0.22834560871124268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,4,power_law_1.2,0.23423359394073487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,balanced,13.141797383626303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,4,power_law_1.2,0.25109760761260985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,4,power_law_1.2,0.266431999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,4,power_law_1.2,0.27370240688323977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,4,power_law_1.2,0.28291199207305906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,4,power_law_1.2,0.2929984092712402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,4,power_law_1.2,0.3174272060394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,4,power_law_1.2,0.319980788230896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,4,power_law_1.2,0.3721920013427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,4,power_law_1.2,0.3924351930618286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,4,power_law_1.2,0.48587517738342284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,4,power_law_1.2,0.5011903762817382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,4,power_law_1.2,0.6742784023284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,4,power_law_1.2,0.0880511999130249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,4,power_law_1.2,0.7420671939849853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,4,power_law_1.2,0.11590399742126464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,4,power_law_1.2,1.0390399932861327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,4,power_law_1.2,0.07676799893379212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,4,power_law_1.2,0.10220799446105958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,4,power_law_1.2,1.2949503898620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,4,power_law_1.2,0.13045120239257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,4,power_law_1.2,1.7659711837768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,4,power_law_1.2,0.15845760107040405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,4,power_law_1.2,0.21671679019927978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,4,power_law_1.2,2.4779264450073244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,4,power_law_1.2,0.2302527904510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,4,power_law_1.2,2.9763200759887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,4,power_law_1.2,0.23812479972839357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,balanced,0.06449066599210103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,4,power_law_1.2,4.489363098144532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,4,power_law_1.2,0.2543231964111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,balanced,0.07343466579914093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,4,power_law_1.2,0.2731647968292236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,balanced,0.10285333792368571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,4,power_law_1.2,9.720806121826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,4,power_law_1.2,0.2742527961730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,balanced,0.15945600469907126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,4,power_law_1.2,0.27993600368499755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,balanced,0.27504533529281616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,4,power_law_1.2,0.31020159721374513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,balanced,0.5115573406219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,4,power_law_1.2,0.35149440765380857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,balanced,0.515445351600647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,4,power_law_1.2,0.36031360626220704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,balanced,0.5174560149510702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,4,power_law_1.2,0.3982656002044678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,balanced,0.5215306679407755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,balanced,0.5256906747817993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,balanced,0.5198613405227661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,4,power_law_1.2,0.4898687839508057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,balanced,0.5224800109863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,balanced,0.5289440155029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,4,power_law_1.2,0.5273280143737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,balanced,0.5351253350575765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,4,power_law_1.2,0.6428287982940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,balanced,0.5440586805343628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,4,power_law_1.2,0.7743360042572022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,balanced,0.5511626799901327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,4,power_law_1.2,1.0190655708312988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,balanced,0.5641866525014242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,balanced,0.6030453443527222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,4,power_law_1.2,1.3482368469238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,4,power_law_1.2,1.6810623168945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,balanced,0.6492319901784261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,4,power_law_1.2,2.360697555541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,balanced,0.05978666742642721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,balanced,0.7244479656219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,balanced,0.0761653333902359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,4,power_law_1.2,3.5289470672607424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,balanced,0.1095199982325236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,balanced,0.1738613247871399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,balanced,0.8048373063405355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,4,power_law_1.2,4.270214462280274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,balanced,0.29443732897440594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,balanced,0.2972533305486043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,balanced,0.301530659198761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,4,power_law_1.2,5.6737407684326175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,balanced,0.9500532944997152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,balanced,0.30691200494766235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,balanced,0.08136533200740814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,balanced,0.3075733383496602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,balanced,0.08825066685676575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,balanced,0.3150186737378438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,4,power_law_1.2,9.806143951416015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,balanced,0.10257599751154582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,balanced,0.3282240033149719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,balanced,1.0875519911448162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,balanced,0.13768000404040018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,balanced,0.32465600967407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,balanced,0.34563732147216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,balanced,0.19563200076421103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,4,power_law_1.2,18.521638488769533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,balanced,0.3253493309020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,balanced,0.35117868582407635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,balanced,0.32865599791208905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,balanced,0.3548053503036499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,balanced,1.449343999226888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,balanced,0.33222933610280353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,balanced,0.3785546620686849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,balanced,0.33666133880615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,balanced,0.40488000710805255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,balanced,0.3404266834259033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,balanced,0.4552053213119507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,balanced,0.34887464841206867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,balanced,0.5286933183670044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,balanced,1.7617066701253254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,balanced,0.35804800192515057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,balanced,0.5684640010197958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,balanced,0.3657279809315999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,balanced,0.3768639961878459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,balanced,0.7158559958140055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,balanced,0.39722132682800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,balanced,0.4128853480021159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,balanced,0.8743840058644613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.01,0.07456640005111695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,balanced,0.4543253183364868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.01,0.058873599767684935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,balanced,2.461018721262614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.01,0.09960960149765015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.01,0.07367039918899536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.01,0.0822655975818634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.01,0.07145599722862243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.01,0.134169602394104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,balanced,1.1953173478444417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.01,0.09492480158805847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.01,0.20562560558319093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,balanced,0.5379626750946045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.01,0.12924799919128419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.01,0.29280641078948977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.01,0.1669119954109192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.01,0.36099839210510254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.01,0.393670392036438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.01,0.22112638950347902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.01,0.4017280101776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.01,0.23100800514221193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,balanced,1.5409386952718098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,balanced,2.9211839040120444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.01,0.42447361946105955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.01,0.23941121101379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.01,0.4373055934906006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.01,0.24564480781555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.01,0.4490687847137451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,balanced,0.6559199889500936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,power_law_1.01,0.08840960264205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.01,0.2643136024475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.01,0.4634431838989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.01,0.4650432109832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.01,0.2723520040512085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,balanced,0.8099520206451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,power_law_1.01,0.10190080404281616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.01,0.5001728057861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.01,0.2937727928161621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,power_law_1.01,0.1016319990158081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.01,0.5291264057159424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,balanced,2.2101546923319497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,balanced,0.9148853619893392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.01,0.31146240234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.01,0.540992021560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,power_law_1.01,0.12707200050354003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.01,0.3290623903274536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.01,0.6312320232391357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,power_law_1.01,0.15812480449676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.01,0.35145599842071534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,balanced,1.2785226504007976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.01,0.6676159858703613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.01,0.35998079776763914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,power_law_1.01,0.193503999710083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.01,0.7677631855010987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,balanced,3.725370724995931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.01,0.4086656093597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.01,0.8327168464660645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,power_law_1.01,0.25920639038085935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,balanced,1.5223414103190105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.01,1.010540771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.01,0.4502399921417236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,power_law_1.01,0.2704639911651611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.01,1.1671999931335448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.01,0.5403071880340576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.01,1.4676735877990723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,power_law_1.01,0.2818176031112671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,balanced,2.656346638997396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.01,0.5932928085327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.01,1.8565248489379882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,power_law_1.01,0.2870847940444946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,balanced,2.3530240058898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.01,0.7536128044128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.01,2.5622783660888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,power_law_1.01,0.30634241104125975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.01,0.888326358795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.01,3.3314048767089846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,power_law_1.01,0.3252351999282837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.01,1.252678394317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.01,4.132947158813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,power_law_1.01,0.34584319591522217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.01,1.597715187072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,balanced,2.9130614598592124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,power_law_1.01,0.37591679096221925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.01,6.918943786621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.01,2.191987228393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,power_law_1.01,0.3986560106277466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.01,2.954707145690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,power_law_1.01,0.43248639106750486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.01,13.118553161621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,power_law_1.01,0.5122816085815429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.01,3.499987030029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,balanced,3.3857971827189126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,balanced,5.5197709401448565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.01,5.525798416137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,balanced,4.29205862681071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,power_law_1.01,0.6199423789978027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.01,12.395404815673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,power_law_1.01,0.6566592216491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,power_law_1.01,0.8727807998657227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,2,power_law_1.2,0.0745024025440216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,power_law_1.01,1.018380832672119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,2,power_law_1.2,0.09824640154838563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,power_law_1.01,1.3654399871826173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,balanced,5.624714533487956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,2,power_law_1.2,0.08339840173721313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,power_law_1.01,1.8040319442749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,2,power_law_1.2,0.12461440563201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,power_law_1.01,2.586297607421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,2,power_law_1.2,0.17138559818267823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,power_law_1.01,3.2043071746826173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,2,power_law_1.2,0.2367232084274292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,balanced,5.100522677103679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,2,power_law_1.2,0.3665855884552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,power_law_1.01,4.958668899536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,2,power_law_1.2,0.38516480922698976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,power_law_1.01,6.496281433105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,2,power_law_1.2,0.39711999893188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,2,power_law_1.2,0.40921602249145506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,balanced,7.003018697102864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,power_law_1.01,7.571756744384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,2,power_law_1.2,0.44135680198669436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,2,power_law_1.2,0.44250879287719724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,power_law_1.01,11.81844482421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,2,power_law_1.2,0.45656957626342776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,2,power_law_1.2,0.47618560791015624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,2,power_law_1.2,0.5406208038330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,power_law_1.01,24.573152160644533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,2,power_law_1.2,0.5682496070861817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,2,power_law_1.2,0.5642240047454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,2,power_law_1.2,0.6317952156066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,2,power_law_1.2,0.6713088035583497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,balanced,10.804303487141928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,2,power_law_1.2,0.7700032234191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,2,power_law_1.2,0.8761856079101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,2,power_law_1.2,1.063225555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,balanced,11.095146179199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,2,power_law_1.2,1.1777024269104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,2,power_law_1.2,1.5114239692687987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,2,power_law_1.2,1.902400016784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,2,power_law_1.2,2.567020797729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,2,power_law_1.2,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,2,power_law_1.2,0.07155200242996215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,2,power_law_1.2,3.550886535644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,2,power_law_1.2,0.06539520025253295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,2,power_law_1.2,4.636569595336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,balanced,10.032288233439127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,2,power_law_1.2,0.08780800104141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,2,power_law_1.2,0.12616959810256959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,2,power_law_1.2,6.8646400451660154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,2,power_law_1.2,0.14890880584716798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,2,power_law_1.2,0.21242239475250244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,2,power_law_1.2,12.71778564453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,2,power_law_1.2,0.22410879135131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,2,power_law_1.2,0.23714559078216552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,2,power_law_1.2,0.24176640510559083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,2,power_law_1.2,0.2568511962890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,2,power_law_1.2,0.2796288013458252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,2,power_law_1.2,0.28767359256744385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,2,power_law_1.2,0.31310720443725587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,2,power_law_1.2,0.3374975919723511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,2,power_law_1.2,0.3639679908752441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,2,power_law_1.2,0.36681599617004396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,2,power_law_1.2,0.42513279914855956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,2,power_law_1.2,0.4598656177520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,2,power_law_1.2,0.5627200126647949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,2,power_law_1.2,0.608684778213501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,balanced,22.052932739257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,2,power_law_1.2,0.7600704193115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,2,power_law_1.2,0.924563217163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,2,power_law_1.2,1.2554431915283204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,2,power_law_1.2,1.5989055633544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,2,power_law_1.2,2.363180732727051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,2,power_law_1.2,2.8846271514892576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,2,power_law_1.2,3.768467330932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,2,power_law_1.2,6.504991912841797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,2,power_law_1.2,12.2836669921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,2,power_law_1.2,0.08760960102081299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,2,power_law_1.2,0.10304000377655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,2,power_law_1.2,0.09259520173072815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,2,power_law_1.2,0.11072640419006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,balanced,0.07851733267307281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,2,power_law_1.2,0.1479423999786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,balanced,0.07758933305740356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,2,power_law_1.2,0.17983360290527345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,balanced,0.10786133011182149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,balanced,0.16931732495625815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,2,power_law_1.2,0.24301440715789796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,balanced,0.29176000754038495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,2,power_law_1.2,0.26897919178009033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,balanced,0.5358560085296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,2,power_law_1.2,0.27645440101623536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,balanced,0.5432266791661581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,2,power_law_1.2,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,balanced,0.5424533287684122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,balanced,0.5451573530832926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,2,power_law_1.2,0.31769599914550783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,balanced,0.5487519900004069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,2,power_law_1.2,0.3243839979171753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,2,power_law_1.2,0.35951359272003175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,balanced,0.5477386713027954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,2,power_law_1.2,0.37553279399871825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,balanced,0.5559786558151245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,2,power_law_1.2,0.4165503978729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,balanced,0.5597759882609049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,balanced,0.5697866678237915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,2,power_law_1.2,0.4572415828704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,balanced,0.5826826492945353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,2,power_law_1.2,0.5365888118743897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,balanced,0.5908159812291464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,balanced,0.6141813198725382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,2,power_law_1.2,0.635103988647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,balanced,0.6850186983744303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,balanced,0.7579200267791748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,2,power_law_1.2,0.6855167865753173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,balanced,0.8747413158416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,2,power_law_1.2,0.9244159698486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,balanced,0.9940373102823893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,2,power_law_1.2,1.0890687942504882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,2,power_law_1.2,1.4397824287414551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,balanced,1.2811306317647297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,2,power_law_1.2,1.8437887191772462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,2,power_law_1.2,2.4735296249389647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,balanced,0.058058664202690125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,balanced,1.638485272725423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,2,power_law_1.2,3.375507354736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,balanced,0.06594133377075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,2,power_law_1.2,5.00843505859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,balanced,0.08608000477155049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,balanced,0.12770666678746542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,2,power_law_1.2,6.42899169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,balanced,0.20573866367340088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,balanced,2.4160639444986978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,balanced,0.3540693521499634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,2,power_law_1.2,7.977305603027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,balanced,0.35875733693440753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,balanced,0.3612266778945923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,balanced,0.1256106694539388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,balanced,0.36532799402872723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,2,power_law_1.2,13.480422973632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,balanced,0.1352000037829081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,balanced,0.36762134234110516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,balanced,2.8619467417399087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,balanced,0.1488533318042755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,balanced,0.3738613526026408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,balanced,0.19028266270955405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,balanced,0.37905065218607586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,2,power_law_1.2,24.302835083007814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,balanced,0.2782133420308431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,balanced,0.3861706654230754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,balanced,0.4190560181935628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,balanced,0.39606932799021405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,balanced,0.427130659421285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,balanced,0.4410826762517293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,balanced,0.41203200817108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,balanced,0.4468959967295329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,balanced,0.4206613302230835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,balanced,4.241039911905925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,balanced,0.45697065194447833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.07543039917945862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.05457280278205871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,balanced,0.4695039987564087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,balanced,0.45289067427317303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,balanced,0.4854880174001058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.07496320009231568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.06276479959487916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,balanced,0.5160319805145264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,balanced,0.5015733242034912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.07099519968032837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,balanced,0.5384320020675659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,balanced,0.5829226573308309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.10734080076217652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.14139519929885863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,balanced,0.5829226573308309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.14974080324172973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.2066879987716675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,balanced,0.6126879851023356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,balanced,0.6811199982961019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.2758016109466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.1903040051460266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,balanced,0.6613920132319132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,balanced,4.847407976786296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.26054399013519286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,balanced,0.7852053642272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.3852096080780029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.27825920581817626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.40378241539001464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.28602240085601804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,balanced,1.0665280024210613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.42856321334838865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.296012806892395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,balanced,0.8153226375579834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.42763519287109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.31765758991241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.33191680908203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.4535935878753662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,balanced,1.3466347058614094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.3538111925125122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.4688447952270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.01,0.3859647989273071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.4869503974914551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.01,0.4089216232299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.01,0.4339456081390381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.5073472023010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,balanced,6.218943913777669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,balanced,1.9086079597473145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.01,0.4488192081451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.5302783966064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,power_law_1.01,0.10970879793167114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,balanced,1.03439466158549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.01,0.5348351955413818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.5612864017486572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,power_law_1.01,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,0.5756288051605225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,balanced,1.3264959653218586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.5996479988098145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,power_law_1.01,0.13729920387268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,0.6952383995056153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.7155903816223145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,0.8034879684448242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,balanced,1.5177013079325359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,power_law_1.01,0.16732159852981568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,balanced,2.510848045349121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.7741504192352295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,1.032691192626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,power_law_1.01,0.21144320964813232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,1.2962944030761718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.9165439605712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,power_law_1.01,0.2531775951385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,balanced,2.2063093185424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,1.8028928756713867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,power_law_1.01,0.3280832052230835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.01,1.0570560455322267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,power_law_1.01,0.3513024091720581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,2.3370304107666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.01,1.3620415687561036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,balanced,2.674597422281901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,power_law_1.01,0.36465280055999755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.01,1.6754623413085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,3.3863616943359376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,balanced,3.725365320841471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,power_law_1.01,0.3756608009338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.01,2.3155071258544924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,4.315135955810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,power_law_1.01,0.4078335762023926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,power_law_1.01,0.42805118560791017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.01,2.731648063659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.07586560249328614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,balanced,4.138976097106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.01,5.433465576171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,power_law_1.01,0.45469441413879397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,balanced,9.266016006469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.01,3.8717952728271485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.07464960217475891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,power_law_1.01,0.5128767967224122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.01,8.023078155517577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,power_law_1.01,0.5747200012207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.01,4.962771224975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.1317247986793518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,power_law_1.01,0.6243584156036377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.18327679634094238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,balanced,5.139109293619792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.01,6.046732711791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.01,15.874514770507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,power_law_1.01,0.7210239887237548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,balanced,4.346218744913737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.37763841152191163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.01,8.797036743164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.3995520114898682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,power_law_1.01,0.8957311630249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.413375997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.01,17.037753295898437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.4311679840087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.01,1.0090815544128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,balanced,7.6431624094645185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.45781121253967283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.01,1.3338047981262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.48737921714782717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.01,1.653023910522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.4886591911315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,balanced,5.575530370076497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.01,2.2737600326538088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.5282112121582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.5338175773620606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.01,2.886675262451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.5696256160736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.01,4.129235076904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.6065408229827881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,balanced,10.164661407470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.01,5.356467056274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.736729621887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.7978752136230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.01,7.8189697265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.9387007713317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,1,power_law_1.2,1.0811903953552247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.01,10.209452819824218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,1,power_law_1.2,1.3759936332702636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,1,power_law_1.2,1.7252031326293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,1,power_law_1.2,2.364441680908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.01,12.671155548095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,1,power_law_1.2,2.7624576568603514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,1,power_law_1.2,3.9018688201904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,balanced,18.34427769978841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,balanced,12.734976450602213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,power_law_1.01,19.984690856933593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,1,power_law_1.2,5.130534362792969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,balanced,8.17029889424642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,1,power_law_1.2,6.437670135498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,1,power_law_1.2,8.810157012939452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,power_law_1.01,39.57144470214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,1,power_law_1.2,17.050367736816405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,balanced,20.00508753458659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,1,power_law_1.2,0.05375360250473023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,1,power_law_1.2,0.061312001943588254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,1,power_law_1.2,0.06940159797668458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,1,power_law_1.2,0.1009600043296814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,1,power_law_1.2,0.13462400436401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,1,power_law_1.2,0.17384320497512817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,1,power_law_1.2,0.253766393661499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,1,power_law_1.2,0.2726912021636963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,1,power_law_1.2,0.27888638973236085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,1,power_law_1.2,0.2991487979888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,1,power_law_1.2,0.317305588722229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,balanced,16.35208511352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,1,power_law_1.2,0.34362239837646485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,1,power_law_1.2,0.3600192070007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,1,power_law_1.2,0.3915839910507202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,1,power_law_1.2,0.42826237678527834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,1,power_law_1.2,0.4510528087615967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,1,power_law_1.2,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,1,power_law_1.2,0.5481791973114014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,1,power_law_1.2,0.6133759975433349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,1,power_law_1.2,0.7145343780517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,1,power_law_1.2,0.844979190826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,1,power_law_1.2,1.069638442993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,1,power_law_1.2,1.324441623687744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,1,power_law_1.2,1.8537343978881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,1,power_law_1.2,2.3930688858032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,balanced,39.81723276774088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,1,power_law_1.2,3.4863616943359377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,1,power_law_1.2,4.587136077880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,1,power_law_1.2,5.685811233520508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,1,power_law_1.2,8.016921234130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,1,power_law_1.2,15.744607543945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,balanced,0.02478400121132533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,balanced,0.024698667228221893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,balanced,0.026661333938439686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,balanced,0.032170665760835014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,balanced,0.05087466537952423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,1,power_law_1.2,0.11052160263061524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,balanced,0.0521066685517629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,1,power_law_1.2,0.1238592028617859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,balanced,0.05212800204753876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,balanced,0.0529013325770696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,1,power_law_1.2,0.1375808000564575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,balanced,0.05299200117588043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,1,power_law_1.2,0.15976959466934204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,balanced,0.05339199801286062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,balanced,0.05409599840641022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,1,power_law_1.2,0.1996351957321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,balanced,0.055248002211252846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,1,power_law_1.2,0.23802878856658935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,balanced,0.055402666330337524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,1,power_law_1.2,0.3236991882324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,balanced,0.05977066854635874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,balanced,0.06081066528956095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,1,power_law_1.2,0.35000319480895997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,balanced,0.06512533128261566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,1,power_law_1.2,0.3604095935821533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,balanced,0.0669653316338857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,1,power_law_1.2,0.38208000659942626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,balanced,0.06896000107129414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,1,power_law_1.2,0.4105984210968018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,balanced,0.07289066910743713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,1,power_law_1.2,0.4414656162261963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,1,power_law_1.2,0.46469759941101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,balanced,0.07884266475836436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,1,power_law_1.2,0.5261312007904053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,1,power_law_1.2,0.5824192047119141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,balanced,0.0918880005677541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,1,power_law_1.2,0.6346367835998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,1,power_law_1.2,0.7363200187683105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,balanced,0.09776533643404643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,balanced,0.03164800008138021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,1,power_law_1.2,0.9171008110046387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,balanced,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,balanced,0.1360213359196981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,balanced,0.03340800106525421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,balanced,0.03557866563399633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.2,1.0294272422790527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,balanced,0.03812266637881597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,power_law_1.01,0.04455040097236633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.2,1.3514431953430175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,balanced,0.03844266633192698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,balanced,0.15220800042152405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,power_law_1.01,0.02885119915008545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,balanced,0.0383146678407987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.2,1.6672704696655274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,balanced,0.02460266649723053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,power_law_1.01,0.030028799176216127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,balanced,0.03942933430274328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,power_law_1.01,0.03431679904460907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,balanced,0.024506665766239166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.2,2.2922176361083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,balanced,0.0388373335202535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,power_law_1.01,0.04090240001678467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,balanced,0.026127999027570088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.2,2.901247978210449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,balanced,0.029114666084448498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,power_law_1.01,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,balanced,0.03984000037113825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,balanced,0.030853333572546642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,balanced,0.20895467201868692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,power_law_1.01,0.04965119957923889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.2,4.1262977600097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,balanced,0.04049599915742874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,balanced,0.032416000962257385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,power_law_1.01,0.05195519924163818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,balanced,0.041696002086003624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.2,5.343020629882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,balanced,0.03421333432197571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,power_law_1.01,0.05297920107841492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,balanced,0.042778665820757546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,power_law_1.01,0.0541055977344513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.2,7.779122924804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,balanced,0.03383466601371765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,balanced,0.04629333317279816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,power_law_1.01,0.05452160239219665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,balanced,0.03436266630887985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,balanced,0.05162666738033295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,power_law_1.01,0.05637120008468628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.2,10.204704284667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,balanced,0.035274667044480644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,power_law_1.01,0.05800319910049438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,balanced,0.052282666166623436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,balanced,0.23971199989318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,balanced,0.03584533433119456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,power_law_1.01,0.4335040092468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.2,12.620185852050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,balanced,0.03711466739575068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,balanced,0.05384533107280731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,power_law_1.01,0.43764481544494627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,balanced,0.03963200002908707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,power_law_1.01,0.4436351776123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,power_law_1.01,0.04044800102710724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,balanced,0.05864533285299937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,1,power_law_1.2,19.902867126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,power_law_1.01,0.07203840017318726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,power_law_1.01,0.07563520073890687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,power_law_1.01,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,power_law_1.01,0.08313599824905396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,power_law_1.01,0.03342080116271973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,balanced,0.06306133170922597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,balanced,0.045925334095954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,power_law_1.01,0.09428480267524719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,power_law_1.01,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,balanced,0.04520533482233683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,power_law_1.01,0.11905920505523682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,1,power_law_1.2,39.444122314453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,power_law_1.01,0.03740800023078918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,balanced,0.06957866748174031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,balanced,0.2942453424135844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,power_law_1.01,0.14831360578536987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,power_law_1.01,0.038624000549316403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,power_law_1.01,0.16219520568847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,power_law_1.01,0.03873279988765717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,balanced,0.07752533257007599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,power_law_1.01,0.1956544041633606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,power_law_1.01,0.038649600744247434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,power_law_1.01,0.2810368061065674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,power_law_1.01,0.04193280041217804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,balanced,0.09155199925104777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,power_law_1.01,0.36401278972625734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,balanced,0.05137600004673004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,power_law_1.01,0.041920000314712526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,power_law_1.01,0.5097536087036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,balanced,0.05648533503214518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,power_law_1.01,0.044998401403427125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,power_law_1.01,0.6917119979858398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,power_law_1.01,0.04782080054283142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,balanced,0.05810666580994924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,balanced,0.10393066207567851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,power_law_1.01,0.050297600030899045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,power_law_1.01,0.9785216331481934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,power_law_1.01,0.05082880258560181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,power_law_1.01,1.9835647583007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,power_law_1.01,0.056966400146484374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,balanced,0.13965866963068643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,power_law_1.01,0.05913599729537964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,balanced,0.06942399839560191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,power_law_1.01,0.06059520244598389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,balanced,0.4426453510920207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,balanced,0.0738613357146581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,power_law_1.01,0.06581760048866273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,power_law_1.01,0.07780479788780212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,16,power_law_1.2,0.04475519955158234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,balanced,0.09532266855239868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,power_law_1.01,0.08967679738998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,balanced,0.1672746737798055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,16,power_law_1.2,0.02858240008354187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,power_law_1.01,0.10959359407424926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,16,power_law_1.2,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,power_law_1.01,0.13738240003585817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,balanced,0.10796800255775452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,power_law_1.01,0.147705602645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,16,power_law_1.2,0.03277440071105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,power_law_1.01,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,power_law_1.01,0.2232192039489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,16,power_law_1.2,0.040479999780654904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,power_law_1.01,0.026662400364875792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,balanced,0.14266666769981384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,power_law_1.01,0.26606719493865966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,balanced,0.23388799031575522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,16,power_law_1.2,0.04856959879398346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,power_law_1.01,0.026105600595474242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,power_law_1.01,0.39816319942474365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,16,power_law_1.2,0.04971520006656647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,power_law_1.01,0.028966400027275085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,power_law_1.01,0.030342400074005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,16,power_law_1.2,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,power_law_1.01,0.4513408184051514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,power_law_1.01,0.03298560082912445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,16,power_law_1.2,0.0542464017868042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,power_law_1.01,0.6668223857879638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,balanced,0.18092799186706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,power_law_1.01,0.03342080116271973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,16,power_law_1.2,0.05545600056648255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,power_law_1.01,0.9510208129882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,power_law_1.01,0.03426559865474701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,16,power_law_1.2,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,power_law_1.01,1.958195114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,16,power_law_1.2,0.05649920105934143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,balanced,0.28918399413426715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,power_law_1.01,0.04082559943199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,16,power_law_1.2,0.056959998607635495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,power_law_1.01,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,16,power_law_1.2,0.43540477752685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,power_law_1.01,0.04517120122909546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,16,power_law_1.2,0.44718079566955565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,power_law_1.01,0.04767360091209412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,16,power_law_1.2,0.44231038093566893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,power_law_1.01,0.05196800231933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,16,power_law_1.2,0.07265920042991639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,balanced,0.2760106722513835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,16,power_law_1.2,0.08600959777832032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,power_law_1.01,0.05596799850463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,16,power_law_1.2,0.08843520283699036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,balanced,0.842303991317749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,power_law_1.01,0.05779839754104614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,16,power_law_1.2,0.10535680055618286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,balanced,0.3585280179977417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,16,power_law_1.2,0.13680000305175782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,power_law_1.01,0.059545600414276124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,16,power_law_1.2,0.2018752098083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,power_law_1.01,0.07428479790687562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,balanced,0.362554669380188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,16,power_law_1.2,0.16605440378189087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,16,power_law_1.2,0.26119680404663087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,power_law_1.01,0.07982079982757569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,16,power_law_1.2,0.3390399932861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,power_law_1.01,0.09165440201759338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,16,power_law_1.2,0.551200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,power_law_1.01,0.1168063998222351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,16,power_law_1.2,0.6601727962493896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,power_law_1.01,0.15845119953155518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,16,power_law_1.2,0.841766357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,power_law_1.01,0.18360960483551025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,16,power_law_1.2,1.5612799644470214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,power_law_1.01,0.3064896106719971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,balanced,0.45415465037027997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,power_law_1.01,0.350598406791687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,16,power_law_1.2,4.009036636352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,power_law_1.01,0.5983551979064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,balanced,0.5478080113728842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,power_law_1.01,0.8714688301086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,power_law_1.01,0.9895551681518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,power_law_1.01,1.5324735641479492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,power_law_1.01,2.7280767440795897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,balanced,0.7088960011800131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,16,power_law_1.2,0.041331198811531064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,16,power_law_1.2,0.03495680093765259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,16,power_law_1.2,0.03378559947013855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,16,power_law_1.2,0.03586559891700745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,16,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,16,power_law_1.2,0.0383103996515274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,balanced,1.0279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,16,power_law_1.2,0.03893119990825653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,16,power_law_1.2,0.04020479917526245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,16,power_law_1.2,0.04327679872512817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,16,power_law_1.2,0.04467200040817261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,16,power_law_1.2,0.04888319969177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,16,power_law_1.2,0.04892799854278564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,16,power_law_1.2,0.05130239725112915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,16,power_law_1.2,0.051571202278137204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,16,power_law_1.2,0.05639680027961731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,balanced,1.3900426228841145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,16,power_law_1.2,0.061478400230407716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,16,power_law_1.2,0.030048000812530517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,16,power_law_1.2,0.06484479904174804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,16,power_law_1.2,0.07006080150604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,16,power_law_1.2,0.025791999697685242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,16,power_law_1.2,0.077920001745224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,16,power_law_1.2,0.026943999528884887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,16,power_law_1.2,0.029267200827598573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,16,power_law_1.2,0.09902080297470092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,16,power_law_1.2,0.030124801397323608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,16,power_law_1.2,0.1263167977333069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,16,power_law_1.2,0.03372159898281098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,16,power_law_1.2,0.033958399295806886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,16,power_law_1.2,0.15203839540481567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,16,power_law_1.2,0.034892800450325015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,16,power_law_1.2,0.03834240138530731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,16,power_law_1.2,0.18997119665145873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,16,power_law_1.2,0.040057599544525146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,16,power_law_1.2,0.2541759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,16,power_law_1.2,0.04534400105476379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,16,power_law_1.2,0.04630399942398071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,16,power_law_1.2,0.31598079204559326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,16,power_law_1.2,0.048607999086380006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,16,power_law_1.2,0.48772478103637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,16,power_law_1.2,0.050918400287628174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,16,power_law_1.2,0.6708352088928222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,balanced,0.023344000180562336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,16,power_law_1.2,0.8597503662109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,balanced,0.02329600105683009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,16,power_law_1.2,0.060140800476074216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,balanced,0.02513066679239273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,16,power_law_1.2,1.3707327842712402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,balanced,0.031184000273545582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,16,power_law_1.2,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,balanced,0.04632533093293508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,16,power_law_1.2,3.4014015197753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,balanced,0.04729066789150238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,16,power_law_1.2,0.06304640173912049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,balanced,0.04807466765244802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,balanced,0.04770133395989736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,16,power_law_1.2,0.07296640276908875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,balanced,0.04831466575463613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,16,power_law_1.2,0.09170560240745544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,balanced,0.03164800008138021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,balanced,0.04845866560935974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,16,power_law_1.2,0.11060479879379273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,balanced,0.03146666785081228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,balanced,0.048986668388048805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,balanced,0.037045332292715706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,16,power_law_1.2,0.12970880270004273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,balanced,0.049866666396458946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,balanced,0.05090666810671488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,balanced,0.0349440003434817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,16,power_law_1.2,0.2090751886367798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,balanced,0.03962666789690653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,balanced,0.05113600194454193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,16,power_law_1.2,0.22846078872680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,balanced,0.039621333281199135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,16,power_law_1.2,0.31573760509490967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,balanced,0.05570666491985321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,balanced,0.04049599915742874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,16,power_law_1.2,0.49395198822021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,balanced,0.05589333176612854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,balanced,0.04020266731580099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,balanced,0.039808000127474465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,balanced,0.06609066824118297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,16,power_law_1.2,0.8471360206604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,balanced,0.03999999910593033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,balanced,0.04248000184694926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,balanced,0.07018133501211803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,16,power_law_1.2,1.1805760383605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,balanced,0.043194666504859924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,balanced,0.04264000058174133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,balanced,0.07367999851703644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,16,power_law_1.2,1.4074048042297362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,balanced,0.044853334625562034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,16,power_law_1.2,2.5744512557983397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,balanced,0.05152533451716105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,balanced,0.07915733257929485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,balanced,0.05365333457787832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,16,power_law_1.2,4.616857528686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,balanced,0.05608533322811127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,balanced,0.08851200342178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,balanced,0.06115733087062836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,balanced,0.10475200414657593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,balanced,0.06810666620731354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,balanced,0.07684266567230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,balanced,0.11245866616566975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,balanced,0.025786665578683216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,balanced,0.08805867036183675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,balanced,0.026741333305835724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,balanced,0.02736533433198929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,power_law_1.01,0.030739200115203858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,balanced,0.10590400298436482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,balanced,0.15945067008336386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,balanced,0.030794667700926464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,power_law_1.01,0.030880001187324525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,balanced,0.03730133424202601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,power_law_1.01,0.02800000011920929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,balanced,0.12010133266448975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,balanced,0.03730666637420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,power_law_1.01,0.03249920010566711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,balanced,0.03685333331425985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,power_law_1.01,0.03624320030212402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,balanced,0.18721065918604532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,balanced,0.03807466725508372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,power_law_1.01,0.047705599665641786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,balanced,0.03916800022125244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,balanced,0.1660373310248057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,power_law_1.01,0.0474047988653183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,balanced,0.039333333571751915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,power_law_1.01,0.047712001204490664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,balanced,0.04201066493988037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,power_law_1.01,0.04938879907131195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,power_law_1.01,0.049670401215553286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,balanced,0.04238933324813843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,power_law_1.01,0.051475197076797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,balanced,0.2611626585324605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,balanced,0.20786666870117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,balanced,0.04500266909599304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,power_law_1.01,0.05292159914970398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,power_law_1.01,0.05492479801177978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,power_law_1.01,0.4394688129425049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,power_law_1.01,0.43775358200073244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,balanced,0.05162133276462555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,power_law_1.01,0.4378496170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,balanced,0.051925331354141235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,balanced,0.29941866795221966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,power_law_1.01,0.07319679856300354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,balanced,0.31573333342870075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,power_law_1.01,0.08056960105895997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,power_law_1.01,0.08960000276565552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,power_law_1.01,0.09763200283050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,power_law_1.01,0.1154047966003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,power_law_1.01,0.15738240480422974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,power_law_1.01,0.03632639944553375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,balanced,0.05778133372465769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,power_law_1.01,0.16189440488815307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,power_law_1.01,0.032364800572395325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,power_law_1.01,0.20809600353240967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,balanced,0.06596266726652782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,balanced,0.3797760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,power_law_1.01,0.03036159873008728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,power_law_1.01,0.2661823987960815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,power_law_1.01,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,balanced,0.06735999882221222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,balanced,0.39737598101298016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,power_law_1.01,0.037913599610328676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,power_law_1.01,0.4142399787902832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,power_law_1.01,0.040031999349594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,power_law_1.01,0.5055615901947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,power_law_1.01,0.04017280042171478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,power_law_1.01,0.040320000052452086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,power_law_1.01,0.634009599685669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,power_law_1.01,0.04182400107383728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,balanced,0.0842026670773824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,power_law_1.01,1.112070369720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,power_law_1.01,0.04392319917678833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,power_law_1.01,0.04498560130596161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,balanced,0.09290132919947307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,power_law_1.01,0.029344001412391664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,power_law_1.01,2.091116714477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,power_law_1.01,0.047116801142692566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,power_law_1.01,0.05220479965209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,power_law_1.01,0.028966400027275085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,balanced,0.4766453504562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,power_law_1.01,0.050335997343063356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,balanced,0.12290133039156596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,power_law_1.01,0.027379199862480164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,power_law_1.01,0.0568448007106781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,power_law_1.01,0.03223040103912354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,power_law_1.01,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,power_law_1.01,0.06468480229377746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,balanced,0.14545067151387533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,power_law_1.01,0.03434880077838898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,power_law_1.01,0.07374719977378845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,power_law_1.01,0.03707520067691803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,power_law_1.01,0.08147199749946595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,power_law_1.01,0.037503999471664426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,power_law_1.01,0.09433599710464477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,power_law_1.01,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,balanced,0.21708800395329794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,balanced,0.5816479921340942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,power_law_1.01,0.11679359674453735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,power_law_1.01,0.13955199718475342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,power_law_1.01,0.040089601278305055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,power_law_1.01,0.18195199966430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,power_law_1.01,0.04179840087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,power_law_1.01,0.2092736005783081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,power_law_1.01,0.044249600172042845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,power_law_1.01,0.2811647891998291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,power_law_1.01,0.04668799936771393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,balanced,0.2885813315709432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,power_law_1.01,0.3960767984390259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,power_law_1.01,0.05136640071868896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,power_law_1.01,0.5547008037567138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,power_law_1.01,0.05568000078201294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,power_law_1.01,0.7126336097717285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,power_law_1.01,1.0134655952453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,balanced,0.7376586596171061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,power_law_1.01,0.05983999967575073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,power_law_1.01,2.1689855575561525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,power_law_1.01,0.0627135992050171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,balanced,0.4169973134994507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,8,power_law_1.2,0.030687999725341798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,power_law_1.01,0.06493440270423889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,8,power_law_1.2,0.02624639868736267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,power_law_1.01,0.08206719756126404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,8,power_law_1.2,0.02736639976501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,power_law_1.01,0.08628479838371277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,8,power_law_1.2,0.031564798951148984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,8,power_law_1.2,0.03319680094718933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,power_law_1.01,0.10682879686355591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,balanced,0.5400266647338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,power_law_1.01,0.1285696029663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,8,power_law_1.2,0.04479359984397888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,power_law_1.01,0.1752575993537903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,8,power_law_1.2,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,power_law_1.01,0.24316799640655518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,8,power_law_1.2,0.04849919974803925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,power_law_1.01,0.33393919467926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,8,power_law_1.2,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,power_law_1.01,0.4838848114013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,8,power_law_1.2,0.050195199251174924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,power_law_1.01,0.7137983798980713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,8,power_law_1.2,0.054124802350997925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,power_law_1.01,0.9013824462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,8,power_law_1.2,0.05496960282325745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,power_law_1.01,1.0651519775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,balanced,1.1380480130513508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,8,power_law_1.2,0.05512319803237915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,balanced,0.6770186424255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,8,power_law_1.2,0.03573760092258453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,8,power_law_1.2,0.43783040046691896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,power_law_1.01,1.9536191940307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,8,power_law_1.2,0.03212159872055054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,8,power_law_1.2,0.4408576011657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,power_law_1.01,3.4847232818603517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,8,power_law_1.2,0.03108479976654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,8,power_law_1.2,0.4403007984161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,8,power_law_1.2,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,8,power_law_1.2,0.07560960054397584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,8,power_law_1.2,0.03663359880447388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,8,power_law_1.2,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,8,power_law_1.2,0.039673599600791934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,8,power_law_1.2,0.09159039855003356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,8,power_law_1.2,0.040243199467658995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,8,power_law_1.2,0.10252159833908081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,8,power_law_1.2,0.04190079867839813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,balanced,1.3821600278218586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,8,power_law_1.2,0.12395520210266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,8,power_law_1.2,0.04259200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,8,power_law_1.2,0.04433920085430145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,8,power_law_1.2,0.15559680461883546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,8,power_law_1.2,0.049292799830436704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,8,power_law_1.2,0.1614527940750122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,8,power_law_1.2,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,8,power_law_1.2,0.05311359763145447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,balanced,1.0566720167795818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,8,power_law_1.2,0.2794431924819946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,8,power_law_1.2,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,8,power_law_1.2,0.06035839915275574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,8,power_law_1.2,0.32856318950653074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,8,power_law_1.2,0.06000000238418579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,8,power_law_1.2,0.06572160124778748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,8,power_law_1.2,0.4376383781433105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,8,power_law_1.2,0.07400320172309875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,8,power_law_1.2,0.6349631786346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,8,power_law_1.2,0.08427519798278808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,8,power_law_1.2,0.8286911964416503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,8,power_law_1.2,0.10222079753875732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,8,power_law_1.2,0.12730239629745482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,8,power_law_1.2,1.442240047454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,8,power_law_1.2,0.16106879711151123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,8,power_law_1.2,0.1768704056739807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,8,power_law_1.2,2.839276885986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,8,power_law_1.2,0.2850368022918701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,8,power_law_1.2,0.2900160074234009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,8,power_law_1.2,0.5335296154022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,8,power_law_1.2,0.6799551963806152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,8,power_law_1.2,0.8999872207641602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,8,power_law_1.2,1.452409553527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,8,power_law_1.2,3.4004543304443358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,balanced,2.0697813034057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,8,power_law_1.2,0.028832000494003297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,8,power_law_1.2,0.02768000066280365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,8,power_law_1.2,0.02794879972934723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,8,power_law_1.2,0.030707201361656188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,8,power_law_1.2,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,8,power_law_1.2,0.038227200508117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,8,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,8,power_law_1.2,0.04051840007305145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,8,power_law_1.2,0.039904001355171206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,8,power_law_1.2,0.044512000679969785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,8,power_law_1.2,0.04644480049610138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,8,power_law_1.2,0.0487744003534317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,8,power_law_1.2,0.05183359980583191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,8,power_law_1.2,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,balanced,0.02362666775782903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,8,power_law_1.2,0.06183040142059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,balanced,0.023631999890009563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,8,power_law_1.2,0.06344959735870362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,balanced,0.026170666019121807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,balanced,0.03179199993610382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,balanced,0.04911466439565023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,8,power_law_1.2,0.06691200137138367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,balanced,0.050016000866889954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,8,power_law_1.2,0.08112000226974488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,balanced,0.05003733436266581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,8,power_law_1.2,0.10403200387954711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,balanced,0.051183998584747314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,balanced,0.05107733110586802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,8,power_law_1.2,0.1180799961090088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,balanced,0.05115733544031779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,8,power_law_1.2,0.14209920167922974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,balanced,0.05232533315817515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,8,power_law_1.2,0.19946880340576173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,8,power_law_1.2,0.284172797203064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,balanced,0.0547680010398229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,8,power_law_1.2,0.4000383853912354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,8,power_law_1.2,0.5806272029876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,balanced,0.05940799911816915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,8,power_law_1.2,0.7777215957641601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,balanced,0.060602664947509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,balanced,0.03186133255561193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,8,power_law_1.2,1.2348223686218263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,balanced,0.06342400113741557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,balanced,0.03141866624355316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,balanced,0.07092266778151195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,8,power_law_1.2,1.5232319831848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,balanced,0.032501332461833954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,balanced,0.08063466846942902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,8,power_law_1.2,2.3421951293945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,balanced,0.037274666130542755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,balanced,0.04297600189844767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,balanced,0.10179733236630757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,balanced,0.04236799975236257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,8,power_law_1.2,5.663980865478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,balanced,0.04457599918047587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,balanced,0.09941333532333374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,balanced,0.044693330923716225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,balanced,0.044256001710891724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,power_law_1.01,0.02714880108833313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,balanced,0.13829867045084634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,power_law_1.01,0.025971201062202454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,balanced,0.04365866879622141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,power_law_1.01,0.02707200050354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,balanced,0.04500266909599304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,power_law_1.01,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,balanced,0.04765866696834564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,balanced,0.14853866895039877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,power_law_1.01,0.03804160058498383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,balanced,0.04911466439565023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,power_law_1.01,0.047065600752830505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,balanced,0.03044266750415166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,balanced,0.05212266743183136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,power_law_1.01,0.04945279955863953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,power_law_1.01,0.04987519979476929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,balanced,0.031541332602500916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,balanced,0.20592532555262247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,balanced,0.05840000013510386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,power_law_1.01,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,balanced,0.03215999901294708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,power_law_1.01,0.05175679922103882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,balanced,0.05951466659704844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,balanced,0.035717333356539406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,power_law_1.01,0.0543936014175415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,balanced,0.04165866722663244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,balanced,0.06445333361625671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,power_law_1.01,0.05839999914169312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,balanced,0.042768001556396484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,power_law_1.01,0.05860480070114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,balanced,0.043663998444875084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,balanced,0.07131200035413106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,balanced,0.2674186627070109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,power_law_1.01,0.43485441207885744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,balanced,0.043605332573254905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,power_law_1.01,0.4392064094543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,balanced,0.04524266719818115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,balanced,0.07703466713428497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,power_law_1.01,0.44405760765075686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,balanced,0.04513066510359446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,power_law_1.01,0.44190077781677245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,balanced,0.04706133405367533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,power_law_1.01,0.03491199910640717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,balanced,0.0904906690120697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,balanced,0.05017066498597463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,power_law_1.01,0.44983677864074706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,power_law_1.01,0.030329599976539612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,power_law_1.01,0.0963648021221161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,balanced,0.10175466537475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,balanced,0.05475200215975443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,power_law_1.01,0.03223679959774017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,balanced,0.3885226647059123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,power_law_1.01,0.11272959709167481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,power_law_1.01,0.03617280125617981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,power_law_1.01,0.039577600359916684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,balanced,0.13436800241470337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,power_law_1.01,0.13071999549865723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,power_law_1.01,0.04359680116176605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,power_law_1.01,0.15438719987869262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,balanced,0.06304533282915752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,power_law_1.01,0.04447999894618988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,balanced,0.15870933731396994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,power_law_1.01,0.04410240054130554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,balanced,0.0639466643333435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,power_law_1.01,0.18232959508895874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,power_law_1.01,0.044787201285362246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,power_law_1.01,0.232857608795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,power_law_1.01,0.04522239863872528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,power_law_1.01,0.047065600752830505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,balanced,0.4919626712799072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,power_law_1.01,0.031302401423454286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,power_law_1.01,0.3440000057220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,balanced,0.21970667441685995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,power_law_1.01,0.05555199980735779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,power_law_1.01,0.4919487953186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,power_law_1.01,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,balanced,0.07193066676457723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,4,power_law_1.2,0.02640640139579773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,power_law_1.01,0.03227519989013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,power_law_1.01,0.06116480231285095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,power_law_1.01,0.638969612121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,power_law_1.01,0.06645119786262513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,power_law_1.01,0.0377920001745224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,4,power_law_1.2,0.02396800071001053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,balanced,0.08555733164151509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,power_law_1.01,0.06869120001792908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,power_law_1.01,0.7477824211120605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,balanced,0.2873813311258952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,power_law_1.01,0.03923200070858002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,4,power_law_1.2,0.027628800272941588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,power_law_1.01,0.08387839794158936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,power_law_1.01,0.04360319972038269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,4,power_law_1.2,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,power_law_1.01,1.350483226776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,power_law_1.01,0.09102079868316651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,balanced,0.08948266506195068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,power_law_1.01,0.044435200095176694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,power_law_1.01,0.10685440301895141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,4,power_law_1.2,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,power_law_1.01,0.04601599872112274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,power_law_1.01,0.12597119808197021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,power_law_1.01,2.5447935104370116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,4,power_law_1.2,0.048172798752784726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,power_law_1.01,0.16186879873275756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,balanced,0.6264426708221436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,power_law_1.01,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,4,power_law_1.2,0.04917759895324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,power_law_1.01,0.21568639278411866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,power_law_1.01,0.04888960123062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,power_law_1.01,0.28743040561676025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,4,power_law_1.2,0.05132799744606018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,balanced,0.4533439874649048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,power_law_1.01,0.05116159915924072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,balanced,0.11440533399581909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,power_law_1.01,0.35291519165039065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,4,power_law_1.2,0.05268480181694031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,power_law_1.01,0.055206400156021115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,power_law_1.01,0.5088575839996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,4,power_law_1.2,0.051948797702789304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,power_law_1.01,0.0592960000038147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,power_law_1.01,0.6706240177154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,4,power_law_1.2,0.05804799795150757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,balanced,0.12873599926630655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,power_law_1.01,0.06563199758529663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,4,power_law_1.2,0.13741439580917358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,power_law_1.01,0.9559359550476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,4,power_law_1.2,0.36491520404815675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,power_law_1.01,1.352684783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,4,power_law_1.2,0.44142718315124513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,balanced,0.19822933276494345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,power_law_1.01,0.07193599939346314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,power_law_1.01,2.813235282897949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,4,power_law_1.2,0.4451136112213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,balanced,0.5880106687545776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,power_law_1.01,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,4,power_law_1.2,0.44854397773742677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,4,power_law_1.2,0.4472959995269775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,balanced,0.2529813249905904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,4,power_law_1.2,0.45957121849060056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,power_law_1.01,0.08173440098762512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,4,power_law_1.2,0.10263680219650269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,balanced,0.9596906503041586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,power_law_1.01,0.09575679898262024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,4,power_law_1.2,0.13050240278244019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,balanced,0.3591359853744507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,power_law_1.01,0.11098239421844483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,4,power_law_1.2,0.14108799695968627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,4,power_law_1.2,0.1692479968070984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,power_law_1.01,0.13371520042419432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,4,power_law_1.2,0.19363839626312257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,power_law_1.01,0.1708672046661377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,balanced,0.7373812993367513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,4,power_law_1.2,0.29948160648345945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,4,power_law_1.2,0.37560319900512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,power_law_1.01,0.24705278873443604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,balanced,0.4651413361231486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,4,power_law_1.2,0.5556096076965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,power_law_1.01,0.3428607940673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,power_law_1.01,0.4850304126739502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,4,power_law_1.2,0.6699264049530029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,power_law_1.01,0.5898496150970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,4,power_law_1.2,0.9620991706848144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,power_law_1.01,0.9071040153503418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,4,power_law_1.2,1.446560001373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,balanced,0.6859359741210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,power_law_1.01,1.2659008026123046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,power_law_1.2,3.408230209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,power_law_1.01,1.513651180267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,power_law_1.01,2.5048896789550783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,power_law_1.01,4.555347061157226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,balanced,1.1618080139160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,balanced,0.8969013690948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,4,balanced,1.7610774040222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,4,power_law_1.2,0.03386879861354828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,4,power_law_1.2,0.030118399858474733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,4,power_law_1.2,0.03144960105419159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,balanced,1.1205493609110515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,4,power_law_1.2,0.034483200311660765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,4,power_law_1.2,0.03678719997406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,4,power_law_1.2,0.04266240000724793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,4,power_law_1.2,0.04366720020771027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,4,power_law_1.2,0.04374400079250336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,4,power_law_1.2,0.04508160054683685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,4,power_law_1.2,0.04700160026550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,4,power_law_1.2,0.04938879907131195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,4,power_law_1.2,0.05226879715919495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,4,power_law_1.2,0.05583999752998352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,4,power_law_1.2,0.05594879984855652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,4,power_law_1.2,0.06542720198631287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,balanced,1.7663572629292805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,4,power_law_1.2,0.06759679913520814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,4,power_law_1.2,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,balanced,2.1426080067952475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,4,power_law_1.2,0.08776959776878357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,4,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,4,power_law_1.2,0.1119871973991394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,4,power_law_1.2,0.13608319759368898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,4,power_law_1.2,0.16788480281829835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,4,power_law_1.2,0.20536959171295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,4,power_law_1.2,0.29777278900146487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,4,power_law_1.2,0.39613440036773684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,4,power_law_1.2,0.6810175895690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,4,power_law_1.2,0.8749823570251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,4,power_law_1.2,1.1644160270690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,4,power_law_1.2,1.612985610961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,4,power_law_1.2,3.616486358642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,4,power_law_1.2,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,4,power_law_1.2,0.030847999453544616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,4,power_law_1.2,0.0324864000082016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,4,power_law_1.2,0.03683840036392212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,4,power_law_1.2,0.038790398836135866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,balanced,3.473818778991699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,4,power_law_1.2,0.04387840032577515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,balanced,0.048858667413393654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,4,power_law_1.2,0.044300800561904906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,balanced,0.0425546665986379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,4,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,balanced,0.05366933345794678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,4,power_law_1.2,0.046374401450157164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,balanced,0.0767146646976471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,4,power_law_1.2,0.04963839948177338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,balanced,0.12771200140317282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,4,power_law_1.2,0.05616000294685364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,balanced,0.12854400277137756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,4,power_law_1.2,0.05863680243492127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,balanced,0.12929600477218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,4,power_law_1.2,0.057843202352523805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,4,power_law_1.2,0.06575999855995178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,balanced,0.12820266683896384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,balanced,0.1283626655737559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,balanced,0.12869333227475485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,4,power_law_1.2,0.07319039702415467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,balanced,0.12905599673589072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,balanced,0.13109333316485086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,4,power_law_1.2,0.07923200130462646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,balanced,0.1314826707045237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,balanced,0.1325920025507609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,4,power_law_1.2,0.0840448021888733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,balanced,0.1383840044339498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,balanced,0.1432266632715861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,4,power_law_1.2,0.09901440143585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,balanced,0.04182933270931244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,balanced,0.14573333660761514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,4,power_law_1.2,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,balanced,0.03814399987459183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,balanced,0.1495413382848104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,4,power_law_1.2,0.13605120182037353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,balanced,0.03968533376852671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,balanced,0.15756799777348837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,4,power_law_1.2,0.19259519577026368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,balanced,0.05871999760468801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,balanced,0.08360000451405843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,4,power_law_1.2,0.28441600799560546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,balanced,0.16802666584650675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,balanced,0.08501332998275757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,4,power_law_1.2,0.3509119987487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,balanced,0.08550399541854858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,4,power_law_1.2,0.5525184154510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,balanced,0.18042665719985962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,balanced,0.08692800005276997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,4,power_law_1.2,0.6640511989593506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,balanced,0.08681600292523702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,4,power_law_1.2,1.1182208061218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,balanced,0.21492799123128256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,balanced,0.08758399883906047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,4,power_law_1.2,1.3113344192504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,balanced,0.08801066875457764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,4,power_law_1.2,1.901420783996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,balanced,0.08828266461690266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,balanced,0.22395733992258707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,balanced,0.09019733468691508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,4,power_law_1.2,2.7578815460205077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,balanced,0.0913813312848409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,4,power_law_1.2,5.930329513549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,balanced,0.09648533662160237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.12260479927062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,balanced,0.09637866417566936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.05310720205307007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,balanced,0.29389333724975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,balanced,0.10072533289591472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,balanced,0.03014400104681651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.067084801197052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,balanced,0.10744000474611919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.07895680069923401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,balanced,0.029968000948429108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.09210879802703857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,balanced,0.03364799916744232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,balanced,0.11603200435638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,balanced,0.3222879966100057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,balanced,0.05442133545875549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.1274880051612854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,balanced,0.07755733529726665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,balanced,0.12822932998339334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.1130687952041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,balanced,0.07898133496443431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.12456320524215699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,balanced,0.14075733224550882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,balanced,0.08003733555475871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.1271232008934021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,balanced,0.07976533472537994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,balanced,0.0806879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.12855679988861085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,balanced,0.16922666629155478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,balanced,0.08210133512814839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,balanced,0.472762664159139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.12814719676971437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,balanced,0.08244266609350841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.132806396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,balanced,0.08329600095748901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.13537280559539794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,balanced,0.19538666804631552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,balanced,0.08475733796755473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.1354367971420288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,balanced,0.08627733588218689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.15083520412445067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.16442240476608277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,balanced,0.25970667600631714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.15107840299606323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,balanced,0.578874667485555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.17864960432052612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,balanced,0.09244267145792644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.20330240726470947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.224236798286438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,balanced,0.09289600451787312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,balanced,0.31354133288065594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.2644351959228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.01,0.3153215885162354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.01,0.3971647977828979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.08369920253753663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.01,0.5058623790740967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.04992640018463135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.01,0.6440000057220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.05121920108795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.01,1.0928895950317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,balanced,0.45396268367767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.06391040086746216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,balanced,0.7316160202026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.06638720035552978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.01,1.2442239761352538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,balanced,0.09830400347709656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.07882239818572997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.01,1.6869440078735352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,balanced,0.10658666491508484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.08371840119361877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.08357120156288148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,balanced,0.11120532949765523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.01,2.611903953552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.08751999735832214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.08604159951210022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.01,4.670233535766601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.08615679740905761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,balanced,0.5602399905522665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.09315840005874634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,balanced,0.1300106644630432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.09738879799842834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.09468799829483032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,balanced,0.14083733161290488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.09829760193824769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.10932480096817017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,balanced,0.18337599436442056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.11043839454650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.12801920175552367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,balanced,1.0982293287913005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,power_law_1.01,0.07694720029830933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.14510719776153563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,balanced,0.21098132928212485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,power_law_1.01,0.04742400050163269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.16095999479293824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,balanced,0.696021318435669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,power_law_1.01,0.039084801077842714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.22410240173339843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,power_law_1.01,0.05598719716072083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,power_law_1.01,0.062489598989486694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.31795198917388917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,power_law_1.01,0.07535359859466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.32835841178894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,power_law_1.01,0.07461760044097901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.055289602279663085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,0.43831682205200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,power_law_1.01,0.08112000226974488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,power_law_1.01,0.08161919713020324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,0.5832128047943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,balanced,0.3153546651204427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,power_law_1.01,0.08597760200500489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.06788480281829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,0.8328960418701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,power_law_1.01,0.08810880184173583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.09325439929962158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,power_law_1.01,0.0906175971031189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,0.9203392028808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,power_law_1.01,0.1004032015800476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.11117440462112427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,power_law_1.01,0.10882560014724732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.01,1.2753408432006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.1186560034751892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,balanced,0.40116798877716064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.12038400173187255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.01,2.2542463302612306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,power_law_1.01,0.10805759429931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.12768640518188476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,power_law_1.01,0.1181056022644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.13055360317230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.01,4.0700927734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.13178240060806273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,balanced,1.0809439818064372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.13820799589157104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,power_law_1.01,0.11304960250854493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.14391679763793946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,power_law_1.01,0.14612480401992797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,balanced,0.5943359931310018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.01,0.16948479413986206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.13401600122451782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.150271999835968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.01,0.18272000551223755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.16149760484695436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.01,0.24184319972991944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.01,0.3391551971435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.16621439456939696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.01,0.5305088043212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.20076799392700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.21293439865112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.01,0.6600319862365722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,balanced,0.7898773352305094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.25552000999450686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.01,1.0525888442993163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,16,power_law_1.2,0.34144001007080077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.01,1.316262435913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,balanced,2.13482666015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,16,power_law_1.2,0.4251455783843994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.01,1.71331844329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,16,power_law_1.2,0.4902207851409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,power_law_1.01,2.281888008117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,16,power_law_1.2,0.6774400234222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,16,power_law_1.2,0.866643238067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,power_law_1.01,4.312550354003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,16,power_law_1.2,1.498579216003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,16,power_law_1.2,1.9449087142944337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,power_law_1.01,6.86429443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,16,power_law_1.2,2.3177536010742186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,balanced,0.9811519781748453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,16,power_law_1.2,4.193356704711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.046105599403381346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,16,power_law_1.2,7.815058898925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.05704960227012634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.06452479958534241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.07921280264854431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.08584960103034973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,balanced,2.0996267000834146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.08657919764518737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.08524799942970276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.08782079815864563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.09511039853096008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.10054399967193603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.09893760085105896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.11119999885559081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,balanced,1.5522720019022624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.11618560552597046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.13872640132904052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.15786880254745483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.18808319568634033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.2575040102005005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.36533119678497317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.41292800903320315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,0.5147712230682373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,0.7126463890075684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,1.0386879920959473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,1.6546943664550782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,16,power_law_1.2,1.9517440795898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,16,power_law_1.2,2.7973440170288084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,16,power_law_1.2,6.106592178344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,16,power_law_1.2,0.07753599882125854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,16,power_law_1.2,0.04917120039463043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,16,power_law_1.2,0.04083200097084046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,16,power_law_1.2,0.05322880148887634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,16,power_law_1.2,0.06119040250778198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,16,power_law_1.2,0.07563520073890687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,16,power_law_1.2,0.0781823992729187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,balanced,3.048778533935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,16,power_law_1.2,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,16,power_law_1.2,0.0834496021270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,16,power_law_1.2,0.0832256019115448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,16,power_law_1.2,0.088755202293396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,16,power_law_1.2,0.09241600036621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,16,power_law_1.2,0.10025600194931031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,16,power_law_1.2,0.10771839618682862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,16,power_law_1.2,0.11455359458923339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,16,power_law_1.2,0.12492159605026246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,balanced,0.03989866624275843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,16,power_law_1.2,0.1322368025779724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,balanced,0.03913066784540812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,16,power_law_1.2,0.1460927963256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.2,0.19154560565948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,balanced,0.05313600103060404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,balanced,0.07365333537260692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.2,0.2564160108566284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,balanced,0.130021333694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.2,0.34123520851135253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,balanced,0.12843199570973715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.2,0.38321919441223146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,balanced,0.1297546625137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.2,0.5795199871063232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,balanced,0.12877866625785828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,balanced,0.12845866878827414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.2,0.8384127616882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,balanced,0.1293280025323232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.2,1.2154303550720216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,balanced,0.13106133540471396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.2,2.0976703643798826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,balanced,0.13168533643086752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.2,2.2603839874267577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,balanced,0.1332533359527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,balanced,0.0352960005402565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,16,power_law_1.2,3.1910911560058595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,balanced,0.13378666838010153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,balanced,0.03472533325354258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,balanced,0.14011733730634054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,balanced,0.03851199895143509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,16,power_law_1.2,5.29633903503418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,balanced,0.059061333537101746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,balanced,0.14448533455530801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,balanced,0.0844586690266927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,balanced,0.08524266878763835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,balanced,0.14945600430170694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,16,power_law_1.2,12.786534118652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,balanced,0.08682666222254436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,balanced,0.155541330575943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,balanced,0.08693333466847737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,balanced,0.08717333277066548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,balanced,0.16358400384585062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,balanced,0.08829333384831746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,balanced,0.08913066983222961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,balanced,0.08964799841245015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,balanced,0.17746132612228394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.01,0.07736319899559022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,balanced,0.0906880001227061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,balanced,0.0930560032526652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.01,0.04971520006656647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,balanced,0.18918933471043906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,balanced,0.09989866614341736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.01,0.05800319910049438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,balanced,0.10033067067464192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.01,0.06488320231437683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,balanced,0.10630399982134502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,balanced,0.2320853273073832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.01,0.08341119885444641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,balanced,0.11400000254313152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.01,0.1167680025100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,balanced,0.02996266633272171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,balanced,0.1241973340511322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,balanced,0.2553013364473979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.01,0.11726720333099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.01,0.054816001653671266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,balanced,0.03084266682465871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,balanced,0.1386240025361379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.01,0.12092800140380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.01,0.04261760115623474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,balanced,0.055760001142819725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.01,0.11954560279846191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.01,0.04108160138130188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,balanced,0.15244266390800476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,balanced,0.07898133496443431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.01,0.12273279428482056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,balanced,0.33965333302815753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,balanced,0.08067733546098073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.01,0.05674880146980286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,balanced,0.08227733274300893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.01,0.12807040214538573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,balanced,0.08251200119654338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,balanced,0.19589867194493613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.01,0.06232320070266724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.01,0.13474559783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,balanced,0.08361066381136577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.01,0.13728640079498292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.01,0.08016639947891235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,balanced,0.08389332890510559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.01,0.14147839546203614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,balanced,0.08538132905960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.01,0.08011519908905029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,balanced,0.2304906646410624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,balanced,0.3777066469192505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,balanced,0.0869813362757365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.01,0.1444607973098755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.01,0.0809984028339386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,balanced,0.08932266632715861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.01,0.08490880131721497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.01,0.15532159805297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,balanced,0.09146666526794434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.01,0.08455680012702942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.01,0.16050560474395753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,balanced,0.3158400058746338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.01,0.17498879432678222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.01,0.09128959774971009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.01,0.20865919589996337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.01,0.09169279932975768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.01,0.22716159820556642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.01,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,balanced,0.09880000352859497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,balanced,0.5550933281580607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.01,0.24681599140167237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,balanced,0.09964799880981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.01,0.09728639721870422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,balanced,0.37615466117858887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.01,0.3388927936553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.01,0.10101759433746338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.01,0.35129599571228026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.01,0.11039999723434449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.01,0.4849855899810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.01,0.11402239799499511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.01,0.6377535820007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.01,0.1244096040725708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.01,0.94268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,balanced,0.10774933298428853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.01,0.14816000461578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,balanced,0.5518186489741007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.01,1.1942784309387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.01,0.174892795085907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,balanced,0.12008000413576762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,balanced,0.6898240248362223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.01,0.20792319774627685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.01,1.4921536445617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,balanced,0.12770133217175803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.01,0.2873471975326538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.01,2.1964288711547852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.01,0.3367487907409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.01,0.42200322151184083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,power_law_1.01,0.05539199709892273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.01,4.694598388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,balanced,0.15550933281580606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.01,0.5967103958129882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,power_law_1.01,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,balanced,0.6980319817860922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,balanced,0.17436800400416055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.01,0.8320639610290528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,power_law_1.01,0.04217599928379059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,power_law_1.01,0.052262401580810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,8,power_law_1.2,0.07715839743614197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.01,1.1367808341979981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,balanced,0.8750933011372884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,balanced,0.261957327524821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,power_law_1.01,0.061887997388839724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,8,power_law_1.2,0.04747520089149475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.01,1.3540224075317382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,8,power_law_1.2,0.05560960173606873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,power_law_1.01,0.07545599937438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.01,2.0496959686279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,balanced,0.31649599472681683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,8,power_law_1.2,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,power_law_1.01,0.0816703975200653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,8,power_law_1.2,0.08835840225219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,power_law_1.01,0.08332160115242004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.01,4.21069450378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,8,power_law_1.2,0.11406079530715943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,power_law_1.01,0.08389120101928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,8,power_law_1.2,0.12436480522155761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,balanced,0.8778080145517985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,power_law_1.01,0.08515840172767639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,8,power_law_1.2,0.12146559953689576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,power_law_1.01,0.09184640049934387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,balanced,0.45213866233825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,8,power_law_1.2,0.12423039674758911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,power_law_1.01,0.09107199907302857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,8,power_law_1.2,0.12920960187911987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,power_law_1.01,0.10170880556106568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,8,power_law_1.2,0.12774399518966675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,power_law_1.01,0.10610560178756714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,8,power_law_1.2,0.13747199773788452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,balanced,0.5749546686808268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,8,power_law_1.2,0.13838720321655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,balanced,1.3728853861490886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,power_law_1.01,0.11427839994430541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,8,power_law_1.2,0.14108799695968627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,power_law_1.01,0.1193343997001648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,8,power_law_1.2,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,8,power_law_1.2,0.16764160394668579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,8,power_law_1.2,0.1645248055458069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,balanced,0.8538080056508383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,power_law_1.01,0.12490240335464478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,8,power_law_1.2,0.18339840173721314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,power_law_1.01,0.15392639636993408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,8,power_law_1.2,0.21191039085388183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,balanced,1.344106674194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,8,power_law_1.2,0.2344831943511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,power_law_1.01,0.17636480331420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,8,power_law_1.2,0.2918976068496704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,power_law_1.01,0.2329792022705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,8,power_law_1.2,0.40191359519958497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,8,power_law_1.2,0.44645118713378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,power_law_1.01,0.26629760265350344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,8,power_law_1.2,0.5382016181945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,balanced,1.1308586597442627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,power_law_1.01,0.4004223823547363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,8,power_law_1.2,0.7617792129516602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,power_law_1.01,0.4969344139099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,8,power_law_1.2,1.0874303817749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,power_law_1.01,0.7716351985931397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,8,power_law_1.2,1.8923839569091796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,power_law_1.01,0.9108799934387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,8,power_law_1.2,2.325312042236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,power_law_1.01,1.4597248077392577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,8,power_law_1.2,3.1881664276123045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,power_law_1.01,1.9093759536743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,power_law_1.2,9.060671997070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,balanced,1.4010079701741536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,power_law_1.01,2.398476791381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,power_law_1.01,3.5895103454589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,8,power_law_1.2,0.05447040200233459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,power_law_1.01,7.4457855224609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,8,power_law_1.2,0.03820799887180328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,8,power_law_1.2,0.04120959937572479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,8,power_law_1.2,0.05013759732246399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,8,balanced,2.737914721171061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,8,power_law_1.2,0.05753600001335144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,8,power_law_1.2,0.08162559866905213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,8,power_law_1.2,0.08300799727439881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,8,power_law_1.2,0.08362879753112792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,8,power_law_1.2,0.08503680229187012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,8,power_law_1.2,0.08840960264205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,8,power_law_1.2,0.09205759763717651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,balanced,2.2321653366088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,balanced,2.612565358479818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,8,power_law_1.2,0.09291520118713378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,8,power_law_1.2,0.09792640209197997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,8,power_law_1.2,0.097952002286911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,8,power_law_1.2,0.10414719581604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,8,power_law_1.2,0.11274240016937256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,8,power_law_1.2,0.11543040275573731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,8,power_law_1.2,0.13654400110244752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,8,power_law_1.2,0.15953919887542725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,8,power_law_1.2,0.18134399652481079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,8,power_law_1.2,0.2363136053085327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,8,power_law_1.2,0.32487680912017824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,8,power_law_1.2,0.36839680671691893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,8,power_law_1.2,0.49553279876708983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,8,power_law_1.2,0.6148352146148681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,8,power_law_1.2,1.1040831565856934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,8,power_law_1.2,1.2872511863708496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,8,power_law_1.2,1.5423168182373046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,8,power_law_1.2,2.5946048736572265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,8,power_law_1.2,5.854668807983399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,balanced,4.399759928385417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,8,power_law_1.2,0.05472000241279602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,8,power_law_1.2,0.03985919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,8,power_law_1.2,0.039929598569869995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,balanced,0.03730133424202601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,8,power_law_1.2,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,balanced,0.039135999977588654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,8,power_law_1.2,0.0559935986995697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,balanced,0.053455998500188194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,8,power_law_1.2,0.07605119943618774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,balanced,0.08078933258851369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,balanced,0.12923199931780496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,8,power_law_1.2,0.0782975971698761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,8,power_law_1.2,0.08191360235214233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,balanced,0.13058132926623026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,8,power_law_1.2,0.08603519797325135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,balanced,0.13174933195114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,8,power_law_1.2,0.08556159734725952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,balanced,0.1325440009435018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,8,power_law_1.2,0.08922240138053894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,balanced,0.13340266545613608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,balanced,0.13307199875513712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,8,power_law_1.2,0.09656959772109985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,8,power_law_1.2,0.09486079812049866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,balanced,0.13311466574668884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,balanced,0.13517333070437113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,8,power_law_1.2,0.11149439811706544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,balanced,0.1363200048605601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,balanced,0.13834666212399802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,8,power_law_1.2,0.11614079475402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,balanced,0.14566933115323386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,balanced,0.1507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,8,power_law_1.2,0.13058559894561766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,balanced,0.1572426656881968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,balanced,0.1711840033531189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,8,power_law_1.2,0.1343808054924011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,balanced,0.1831573247909546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,8,power_law_1.2,0.15334399938583373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,balanced,0.2015413244565328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,8,power_law_1.2,0.17400959730148316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,8,power_law_1.2,0.26087040901184083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,balanced,0.21785066525141397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,8,power_law_1.2,0.33086719512939455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,8,power_law_1.2,0.4319744110107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,balanced,0.278821329275767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,8,power_law_1.2,0.6110527992248536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,balanced,0.32231465975443524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,8,power_law_1.2,0.93820161819458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,8,power_law_1.2,1.0430591583251954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,8,power_law_1.2,1.942144012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,balanced,0.43778133392333984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,8,power_law_1.2,2.7367168426513673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,balanced,0.0336053321758906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,8,power_law_1.2,3.05346565246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,balanced,0.034314667185147606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,balanced,0.039834665755430855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,8,power_law_1.2,4.9195903778076175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,balanced,0.05961066484451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,balanced,0.5171306530634562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,balanced,0.08507200082143147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,balanced,0.08662399649620056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,8,power_law_1.2,13.354214477539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,balanced,0.08776000142097473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.01,0.052076798677444455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,balanced,0.08839999636014302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.01,0.03826560080051422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.01,0.03994239866733551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,balanced,0.03481066723664602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,balanced,0.08875200152397156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.01,0.03985919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.01,0.0511680006980896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,balanced,0.7554186979929606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.01,0.04195199906826019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,balanced,0.03621333340803782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,balanced,0.09051199754079182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.01,0.06435840129852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.01,0.053286397457122804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,balanced,0.04067733387152354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,balanced,0.09150399764378865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.01,0.06064640283584595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.01,0.07491840124130249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,balanced,0.059152002135912575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.01,0.07768319845199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,balanced,0.09340266386667888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.01,0.1151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,balanced,0.08290666838486989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.01,0.08076159954071045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,balanced,0.09470400214195251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,balanced,0.08544533451398213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.01,0.08313599824905396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.01,0.12195839881896972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.01,0.08565120100975036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,balanced,0.08715200424194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,balanced,0.09757333000500996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.01,0.12337919473648071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.01,0.08746240139007569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,balanced,0.08795199791590373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.01,0.09094399809837342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,balanced,0.10636799534161885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.01,0.12216960191726685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,balanced,0.9585973421732584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.01,0.09401599764823913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,balanced,0.08878933389981587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.01,0.09711999893188476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,balanced,0.09036800265312195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.01,0.12775039672851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,balanced,0.10655466715494792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.01,0.09858559966087341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,balanced,0.09264533718427022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.01,0.11330560445785523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.01,0.12789759635925294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,balanced,0.11552533507347107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,balanced,0.09501866499582927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.01,0.11530879735946656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.01,0.12951040267944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.01,0.12749439477920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,balanced,0.12686933080355325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,balanced,0.09889599680900574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.01,0.13965439796447754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.01,0.13597439527511596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,balanced,0.10361066460609436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.01,0.1519551992416382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,balanced,0.13622933626174927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.01,0.19576319456100463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.01,0.14531199932098388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.01,0.21726720333099364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,balanced,0.15652799606323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.01,0.14962559938430786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.01,0.2956543922424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.01,0.15660159587860106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.01,0.34149119853973386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,balanced,0.17744000752766928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,balanced,1.2008106708526611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.01,0.17286399602890015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.01,0.5041471958160401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,balanced,0.11395200093587239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.01,0.5951871871948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.01,0.19366400241851806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,balanced,0.11643200119336446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,balanced,0.24296534061431885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.01,0.8700608253479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.01,0.21695361137390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.01,1.1883839607238769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.01,0.234771203994751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.01,1.4719296455383302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,balanced,0.2935573259989421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.01,0.28047358989715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.01,2.2679935455322267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.01,0.3691200017929077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,power_law_1.01,0.04156799912452698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.01,0.38022398948669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.01,5.0523326873779295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,balanced,0.13237333297729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,power_law_1.01,0.04289279878139496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.01,0.5803711891174317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,balanced,0.41624001661936444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,power_law_1.01,0.04450559914112091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,balanced,0.15505599975585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.01,0.678220796585083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,power_law_1.01,0.05539199709892273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.01,1.002617645263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,4,power_law_1.2,0.051072001457214355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,balanced,0.16125333309173584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,power_law_1.01,0.06276479959487916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.01,1.3434111595153808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,4,power_law_1.2,0.04229759871959686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,power_law_1.01,0.08071680068969726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,balanced,0.5150400002797445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,4,power_law_1.2,0.050470399856567386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.01,1.5369407653808593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,power_law_1.01,0.08413439989089966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,balanced,1.8225919405619304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,4,power_law_1.2,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,4,power_law_1.2,0.07247359752655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.01,2.722764778137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,power_law_1.01,0.0859008014202118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,balanced,0.2248106598854065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,4,power_law_1.2,0.11148799657821655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,power_law_1.01,0.08895999789237977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.01,5.140774536132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,balanced,0.26638933022816974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,power_law_1.01,0.09122560024261475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,4,power_law_1.2,0.1197119951248169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,power_law_1.01,0.09890559911727906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,4,power_law_1.2,0.12653440237045288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,balanced,0.7666506767272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,power_law_1.01,0.10113919973373413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,4,power_law_1.2,0.12778879404067994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,balanced,0.38975465297698975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,4,power_law_1.2,0.13274879455566407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,power_law_1.01,0.11175040006637574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,4,power_law_1.2,0.1325503945350647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,power_law_1.01,0.11561599969863892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,4,power_law_1.2,0.1374848008155823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,balanced,0.4703893264134725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,4,power_law_1.2,0.14012160301208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,4,power_law_1.2,0.1444991946220398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,power_law_1.01,0.1273151993751526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,4,power_law_1.2,0.155840003490448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,4,power_law_1.2,0.16002559661865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,power_law_1.01,0.14375679492950438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,balanced,0.6851627031962076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,4,power_law_1.2,0.18322559595108032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,balanced,0.9913226763407389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,4,power_law_1.2,0.2128063917160034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,4,power_law_1.2,0.2201472043991089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,power_law_1.01,0.14684159755706788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,4,power_law_1.2,0.25632638931274415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,4,power_law_1.2,0.2891263961791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,balanced,0.8907039960225424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,power_law_1.01,0.18053120374679565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,4,power_law_1.2,0.38801279067993166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,power_law_1.01,0.20254080295562743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,4,power_law_1.2,0.4129727840423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,4,power_law_1.2,0.6310783863067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,power_law_1.01,0.29078400135040283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,4,power_law_1.2,0.7161664009094239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,power_law_1.01,0.3523519992828369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,4,power_law_1.2,1.0116031646728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,power_law_1.01,0.5104640007019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,4,power_law_1.2,1.4724160194396974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,balanced,1.2428906758626301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,power_law_1.01,0.6337152004241944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,balanced,1.3231786886850994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,4,power_law_1.2,1.801055908203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,power_law_1.01,0.9229120254516602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,4,power_law_1.2,3.43043212890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,power_law_1.01,1.2133312225341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,power_law_1.01,1.8441280364990233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,power_law_1.2,6.998067474365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,4,balanced,3.5623947779337564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,power_law_1.01,2.603596878051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,power_law_1.01,2.6441856384277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,power_law_1.01,5.252921676635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,balanced,1.7489120165507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,power_law_1.01,8.950348663330079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,balanced,1.8233812650044758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,balanced,2.178373336791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,4,power_law_1.2,0.0381056010723114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,4,power_law_1.2,0.035718399286270144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,4,power_law_1.2,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,4,power_law_1.2,0.051577597856521606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,4,power_law_1.2,0.05725439786911011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,4,power_law_1.2,0.07848320007324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,4,power_law_1.2,0.08213760256767273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,4,power_law_1.2,0.0843455970287323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,4,power_law_1.2,0.08675199747085571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,4,power_law_1.2,0.08820480108261108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,4,power_law_1.2,0.091839998960495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,4,power_law_1.2,0.0964031994342804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,balanced,3.43830935160319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,4,power_law_1.2,0.0980351984500885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,4,power_law_1.2,0.10554239749908448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,4,power_law_1.2,0.11363840103149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,4,power_law_1.2,0.11806720495223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,4,power_law_1.2,0.12298879623413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,4,power_law_1.2,0.14426239728927612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,4,power_law_1.2,0.16767359972000123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,4,power_law_1.2,0.19853440523147584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,4,power_law_1.2,0.23720960617065429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,4,power_law_1.2,0.32055039405822755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,4,power_law_1.2,0.3536639928817749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,balanced,3.645514806111654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,4,power_law_1.2,0.4944447994232178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,4,power_law_1.2,0.7608960151672364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,4,power_law_1.2,1.0487615585327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,4,power_law_1.2,1.35032320022583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,4,power_law_1.2,1.6475263595581056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,4,power_law_1.2,2.888364791870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,4,power_law_1.2,6.555744171142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,4,power_law_1.2,0.04132480025291443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,4,power_law_1.2,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,balanced,6.78546142578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,4,power_law_1.2,0.0403903990983963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,4,power_law_1.2,0.05095679759979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,4,power_law_1.2,0.05817599892616272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,balanced,0.039647998909155525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,4,power_law_1.2,0.08015999794006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,balanced,0.04211199780305227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,4,power_law_1.2,0.08469120264053345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,balanced,0.05493866900602976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,4,power_law_1.2,0.08872320055961609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,balanced,0.07964266836643219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,balanced,0.13134400049845377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,4,power_law_1.2,0.09264000058174134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,balanced,0.13262933492660522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,balanced,0.1341866652170817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,4,power_law_1.2,0.09556480050086975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,balanced,0.13362133502960205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,4,power_law_1.2,0.09937279820442199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,balanced,0.13355732957522073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,balanced,0.13482133547465006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,4,power_law_1.2,0.10773119926452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,balanced,0.13687466581662497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,4,power_law_1.2,0.11136640310287475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,balanced,0.14152533809343973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,4,power_law_1.2,0.12591999769210815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,balanced,0.14105066657066345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,balanced,0.14524267117182413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,balanced,0.15421332915623984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,balanced,0.1618880033493042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,4,power_law_1.2,0.12929919958114625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,balanced,0.17438934246699014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,4,power_law_1.2,0.13784960508346558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,balanced,0.19394665956497192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,balanced,0.2058453361193339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,4,power_law_1.2,0.14927999973297118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,balanced,0.23948800563812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,4,power_law_1.2,0.19070080518722535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,4,power_law_1.2,0.22256639003753662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,balanced,0.26689600944519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,4,power_law_1.2,0.28883841037750246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,balanced,0.3785119851430257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,4,power_law_1.2,0.387827205657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,4,power_law_1.2,0.5398272037506103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,balanced,0.4553866783777873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,balanced,0.03524799893299738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,4,power_law_1.2,0.6534016132354736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,balanced,0.036570665736993156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,balanced,0.042037333051363625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,4,power_law_1.2,1.0418496131896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,balanced,0.6574133237202963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,balanced,0.06572799881299336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,4,power_law_1.2,1.3129728317260743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,balanced,0.09212266405423482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.01,0.04615040123462677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,balanced,0.09675199786822002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,4,power_law_1.2,1.9739519119262696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,balanced,0.09967999656995137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.01,0.041196799278259276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,4,power_law_1.2,2.65600643157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,balanced,0.09872000416119893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,balanced,0.045125335454940796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,balanced,0.823632001876831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,balanced,0.10115200281143188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.01,0.05194240212440491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,4,power_law_1.2,4.115654373168946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,balanced,0.04758933186531067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,balanced,0.10200533270835876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.01,0.06705920100212097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,balanced,0.05233600238958994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,balanced,0.10319466392199199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,balanced,0.07020266850789388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,4,power_law_1.2,5.405068969726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.01,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,balanced,0.10662933190663655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,balanced,0.09909866253534953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,balanced,0.10328533252080281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,balanced,0.10865066448847453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.01,0.1108672022819519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,balanced,0.10544000069300334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,balanced,0.11311999956766765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.01,0.11800320148468017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,4,power_law_1.2,12.027225494384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,balanced,0.10620799660682678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,balanced,1.2183252970377605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,balanced,0.10854400197664897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,balanced,0.12194133798281352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.01,0.12468479871749878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,balanced,0.11136000355084737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,balanced,0.1256106694539388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.01,0.12535040378570556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,balanced,0.11599999666213989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,balanced,0.14101333419481912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,balanced,0.12145599722862244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.01,0.13019520044326782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,balanced,0.1269439955552419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.01,0.137881600856781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,balanced,0.1604373355706533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,balanced,0.1304586629072825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.01,0.1493631958961487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,balanced,0.1718506614367167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.01,0.1498944044113159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.01,0.15345280170440673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,balanced,0.204367995262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,balanced,1.57858673731486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,balanced,0.14988266428311667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.01,0.1602944016456604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,balanced,0.1529759963353475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,balanced,0.23504533370335898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.01,0.17003519535064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.01,0.18110079765319825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,balanced,0.32793599367141724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.01,0.22490239143371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.01,0.2424448013305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.01,0.2684351921081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,balanced,0.18343466520309448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,balanced,0.4237653414408366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.01,0.3101632118225098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.01,0.03866240084171295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,balanced,0.23128533363342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.01,0.4232192039489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.01,0.03819519877433777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,balanced,0.26526399453481037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,balanced,1.9751680692036946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.01,0.5131264209747315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,balanced,0.644320011138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.01,0.7100992202758789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.01,0.0523967981338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.01,0.8621631622314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.01,0.06316800117492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.01,0.08538879752159119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,balanced,0.3701653480529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.01,1.2971136093139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.01,0.08911359906196595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,balanced,0.8344693183898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.01,1.6509632110595702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,balanced,0.4358079830805461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.01,0.09100160002708435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.01,0.09356160163879394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.01,2.11212158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.01,0.09713919758796692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,balanced,0.6611413160959879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,power_law_1.01,0.04467200040817261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.01,3.546662521362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.01,0.10519039630889893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.01,0.10940799713134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,power_law_1.01,0.04707199931144714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.01,0.11845120191574096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.01,7.04691162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,balanced,0.8133653004964193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,power_law_1.01,0.052083200216293334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,balanced,1.2373279730478923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.01,0.11867519617080688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,power_law_1.01,0.06298239827156067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.01,0.12910720109939575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,power_law_1.01,0.07095680236816407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,balanced,1.1918079853057861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,balanced,2.8584267298380532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.01,0.13439359664916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,power_law_1.01,0.0923520028591156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.01,0.15155839920043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,power_law_1.01,0.09971200227737427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,power_law_1.01,0.10393600463867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.01,0.1750208020210266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,power_law_1.01,0.10613759756088256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.01,0.19854719638824464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,balanced,1.556447982788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,balanced,1.6337226231892903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,power_law_1.01,0.11082240343093872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.01,0.23845760822296141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,power_law_1.01,0.12218879461288452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.01,0.29047679901123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,2,power_law_1.2,0.04594559967517853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,power_law_1.01,0.13019520044326782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.01,0.3778111934661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,power_law_1.01,0.13730560541152953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,2,power_law_1.2,0.04180479943752289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.01,0.44483199119567873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,power_law_1.01,0.15374720096588135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,2,power_law_1.2,0.05121279954910278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,balanced,2.3043626149495444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.01,0.65032958984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,2,power_law_1.2,0.061689597368240354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.01,0.8979455947875976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,2,power_law_1.2,0.07338240146636962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,power_law_1.01,0.1675711989402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,2,power_law_1.2,0.11480319499969482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.01,1.2707072257995606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,power_law_1.01,0.1770367980003357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,balanced,2.040426731109619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,2,power_law_1.2,0.12250239849090576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.01,1.7089727401733399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,2,power_law_1.2,0.12456320524215699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,power_law_1.01,0.1964352011680603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.01,2.2089984893798826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,2,power_law_1.2,0.13166719675064087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,power_law_1.01,0.25747199058532716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,balanced,3.0578400293986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,2,power_law_1.2,0.13581440448760987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.01,3.3578750610351564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,power_law_1.01,0.3109760046005249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,2,power_law_1.2,0.14114559888839723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,2,power_law_1.2,0.1474560022354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.01,7.336473846435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,power_law_1.01,0.3997312068939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,2,power_law_1.2,0.15260159969329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,power_law_1.01,0.5252543926239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,2,power_law_1.2,0.15461119413375854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,power_law_1.01,0.7407231807708741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,2,power_law_1.2,0.164409601688385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,power_law_1.01,0.9977343559265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,2,power_law_1.2,0.17079039812088012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,2,power_law_1.2,0.18875520229339598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,power_law_1.01,1.2959936141967774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,2,power_law_1.2,0.22609920501708985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,power_law_1.01,1.7410623550415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,balanced,3.814533233642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,balanced,5.641567866007487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,2,power_law_1.2,0.2468928098678589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,balanced,2.93779722849528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,power_law_1.01,2.5625024795532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,2,power_law_1.2,0.27409920692443845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,power_law_1.01,3.349203109741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,2,power_law_1.2,0.3449023962020874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,power_law_1.01,4.414751815795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,2,power_law_1.2,0.4552000045776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,2,power_law_1.2,0.5530111789703369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,power_law_1.01,6.5944061279296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,2,power_law_1.2,0.7532288074493408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,2,power_law_1.2,1.0041215896606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,power_law_1.01,13.8140869140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,2,power_law_1.2,1.3767552375793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,2,power_law_1.2,2.000627136230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,2,power_law_1.2,2.3324352264404298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,2,power_law_1.2,4.123558425903321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,balanced,6.035952250162761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,2,power_law_1.2,8.291993713378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,2,power_law_1.2,0.03898879885673523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,2,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,2,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,2,power_law_1.2,0.05000960230827332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,2,power_law_1.2,0.05947520136833191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,2,power_law_1.2,0.08614400029182434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,2,power_law_1.2,0.08754559755325317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,2,power_law_1.2,0.09562879800796509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,balanced,5.819264094034831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,2,power_law_1.2,0.09904639720916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,2,power_law_1.2,0.10074880123138427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,2,power_law_1.2,0.10938880443572999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,2,power_law_1.2,0.11502079963684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,2,power_law_1.2,0.11858559846878051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,2,power_law_1.2,0.12162560224533081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,2,power_law_1.2,0.13043199777603148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,2,power_law_1.2,0.14245760440826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,2,power_law_1.2,0.15345280170440673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,2,power_law_1.2,0.1808832049369812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,balanced,11.94043223063151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,2,power_law_1.2,0.20695040225982667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,2,power_law_1.2,0.24486401081085205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,2,power_law_1.2,0.28254079818725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,2,power_law_1.2,0.4066495895385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,2,power_law_1.2,0.4666624069213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,2,power_law_1.2,0.7438144207000732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,2,power_law_1.2,0.9344832420349121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,2,power_law_1.2,1.3801600456237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,2,power_law_1.2,1.8930944442749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,2,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,2,power_law_1.2,2.2922176361083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,2,power_law_1.2,0.048467200994491574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,2,power_law_1.2,0.05199360251426697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,2,power_law_1.2,3.7248512268066407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,2,power_law_1.2,0.06069120168685913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,2,power_law_1.2,0.06711040139198303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,2,power_law_1.2,7.298777770996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,2,power_law_1.2,0.09484800100326538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,2,power_law_1.2,0.1007807970046997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,2,power_law_1.2,0.1047104001045227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,2,power_law_1.2,0.1131327986717224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,2,power_law_1.2,0.1129472017288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,2,power_law_1.2,0.12424319982528687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,2,power_law_1.2,0.13734400272369385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,2,power_law_1.2,0.14268800020217895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,2,power_law_1.2,0.1513152003288269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,2,power_law_1.2,0.16888320446014404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,2,power_law_1.2,0.18152320384979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,2,power_law_1.2,0.19404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,2,power_law_1.2,0.26810879707336427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,balanced,0.04043200115362803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,2,power_law_1.2,0.3265343904495239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,balanced,0.046426668763160706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,2,power_law_1.2,0.43992319107055666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,balanced,0.05967999994754791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,2,power_law_1.2,0.5366591930389404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,balanced,0.0925439993540446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,2,power_law_1.2,0.7063488006591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,balanced,0.14892799655596414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,2,power_law_1.2,0.9869631767272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,balanced,0.15075733264287314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,balanced,0.15265066425005594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,2,power_law_1.2,1.3127296447753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,balanced,0.1539359986782074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,2,power_law_1.2,1.7236799240112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,balanced,0.15461333592732748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,balanced,0.15758933623631796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,2,power_law_1.2,2.8705728530883787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,balanced,0.0410453329483668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,balanced,0.16211733222007751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,2,power_law_1.2,3.9325630187988283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,balanced,0.16456533471743265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,balanced,0.07560533285140991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,balanced,0.16849066813786825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,2,power_law_1.2,5.009772872924804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,balanced,0.11409599582354228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,balanced,0.17803200085957846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,balanced,0.11626666784286499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,2,power_law_1.2,7.653830718994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,balanced,0.18653867642084757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,balanced,0.11877866586049397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,balanced,0.19323732455571493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,balanced,0.1197760005791982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,2,power_law_1.2,14.360633850097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,balanced,0.21730667352676392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,balanced,0.12213333447774251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,balanced,0.254528005917867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,balanced,0.12297067046165466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,balanced,0.12602133552233377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,balanced,0.2691626747449239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,balanced,0.13057600458463034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,balanced,0.3205333352088928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,balanced,0.13424533605575562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,balanced,0.14414933323860168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,balanced,0.35974931716918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,balanced,0.15583999951680502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,balanced,0.16470932960510254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.0381056010723114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,balanced,0.5474026600519816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,balanced,0.1885333259900411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.041817599534988405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,balanced,0.21293866634368896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.06948480010032654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,balanced,0.7124319871266683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,balanced,0.2361066738764445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.08817920088768005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,balanced,0.2900906602541606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.1276479959487915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.13567999601364136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,balanced,0.3417493502298991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,balanced,1.0818400382995605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.14006400108337402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,balanced,0.5084746678670248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.14865280389785768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.15144959688186646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.16171519756317138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,balanced,1.4521387418111165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,balanced,0.6379733482996622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.03596799969673157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.17766400575637817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.03837440013885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.197324800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.19455360174179076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.05863680243492127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.20003840923309327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,balanced,1.059333324432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.06826239824295044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.21241600513458253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.10145280361175538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.10870399475097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.23590400218963622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,balanced,2.179962635040283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.11025279760360718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.2860415935516357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.11705600023269654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.3180351972579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.12303999662399293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,balanced,1.4181866645812988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.12911360263824462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.36041600704193116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.13819520473480223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.4476799964904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.14691840410232543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.5936831951141357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.15145599842071533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.16613759994506835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.7497920036315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.17750400304794312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.19639040231704713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.01,1.0807040214538575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,balanced,2.9367411931355796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.22629759311676026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,balanced,2.1429012616475425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.2705600023269653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.01,1.4186047554016112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.3350080013275146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.3955647945404053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.01,2.075679969787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,0.5358463764190674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.01,2.7879104614257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,0.6842559814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,0.9977472305297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.01,3.500806427001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,1.3210495948791503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.01,5.771827316284179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,2.0086719512939455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,2.6105791091918946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,balanced,2.6492640177408853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.01,11.486867523193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.01,3.278969573974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,balanced,3.6792214711507163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.01,5.423654556274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.01,10.944345855712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.06470400094985962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.13058559894561766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.1408959984779358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,balanced,3.3254400889078775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.14699519872665406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.15085439682006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.15483520030975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.16847360134124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.19034240245819092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.19617919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.19253120422363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,balanced,5.38424555460612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.20396161079406738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.21570560932159424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.23879680633544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.2880768060684204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.31912319660186766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.36574079990386965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.45235838890075686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,balanced,5.239786783854167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.5979263782501221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.7556159973144532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,1,power_law_1.2,1.0935935974121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,1,power_law_1.2,1.446399974822998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,1,power_law_1.2,2.134886360168457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,1,power_law_1.2,2.8400896072387694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,1,power_law_1.2,0.03596799969673157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,1,power_law_1.2,3.546265411376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,1,power_law_1.2,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,1,power_law_1.2,5.735187149047851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,1,power_law_1.2,0.04570240080356598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,1,power_law_1.2,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,1,power_law_1.2,0.06699519753456115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,power_law_1.2,11.426713562011718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,1,power_law_1.2,0.10066560506820679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,1,power_law_1.2,0.10670720338821411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,1,power_law_1.2,0.11336959600448608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,1,power_law_1.2,0.11941759586334229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,1,power_law_1.2,0.1217919945716858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,1,power_law_1.2,0.13581440448760987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,1,power_law_1.2,0.140774405002594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,1,balanced,10.779642740885416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,1,power_law_1.2,0.14974720478057862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,1,power_law_1.2,0.154310405254364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,1,power_law_1.2,0.169760000705719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,1,power_law_1.2,0.17916159629821776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,1,power_law_1.2,0.19887360334396362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,1,power_law_1.2,0.2318272113800049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,balanced,10.880821228027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,1,power_law_1.2,0.2768512010574341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,1,power_law_1.2,0.3386624097824097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,1,power_law_1.2,0.3998656034469604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,1,power_law_1.2,0.5380352020263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,1,power_law_1.2,0.6908607959747315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,1,power_law_1.2,1.0198783874511719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,1,power_law_1.2,1.3641983985900878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,1,power_law_1.2,2.038694381713867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,1,power_law_1.2,2.6748479843139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,1,power_law_1.2,3.3726528167724608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,1,power_law_1.2,5.465593719482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,1,power_law_1.2,10.988365173339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,balanced,0.06648000081380208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,balanced,0.08650133013725281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,balanced,0.06364800035953522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,balanced,0.07706666489442189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,balanced,0.07319466769695282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,balanced,0.10300266742706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,balanced,0.11002666751543681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,balanced,0.16223999857902527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,balanced,0.17485866943995157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,balanced,0.29290133714675903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,balanced,0.21157334248224893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,balanced,0.3475786844889323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,balanced,0.34779731432596844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,balanced,0.212336003780365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,balanced,0.21331199010213217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,balanced,0.34861334164937335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,balanced,0.2147093415260315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,balanced,0.3491946856180827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,balanced,0.21434666713078818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,balanced,0.350053350130717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,balanced,0.2164213260014852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,balanced,0.35151998202006024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,balanced,0.21734933058420816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,balanced,0.35328535238901776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,balanced,0.05872533222039541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,balanced,0.3545120159784953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,balanced,0.22062400976816812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,balanced,0.05643199880917867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,balanced,0.3568426767985026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,balanced,0.22286399205525717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,balanced,0.0776800016562144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,balanced,0.36354132493336994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,balanced,0.22993600368499756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,balanced,0.11804266770680745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,balanced,0.16821332772572836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,balanced,0.2374239961306254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,balanced,0.3810666799545288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,balanced,0.20438933372497559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,balanced,0.20723199844360352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,balanced,0.2360693415006002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,balanced,0.3884799877802531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,balanced,0.20721065998077393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,balanced,0.2619733413060506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,balanced,0.20753065745035806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,balanced,0.40261868635813397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,balanced,0.20933334032694498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,balanced,0.2608106732368469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,balanced,0.21232000986735025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,balanced,0.4113173484802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,balanced,0.2125920057296753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,balanced,0.2164319952329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,balanced,0.3009919921557109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,balanced,0.4430453379948934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,balanced,0.21947733561197916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,balanced,0.22588799397150675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,balanced,0.3044053316116333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,balanced,0.4427786668141683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,balanced,0.42027199268341064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,balanced,0.6238133509953817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,balanced,0.2291839917500814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,balanced,0.4105493227640788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,balanced,0.5380693276723226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,balanced,0.2392586668332418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,balanced,0.6689600149790446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,balanced,0.9289920330047607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.01,0.2880511999130249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.01,0.34114561080932615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.01,0.14761600494384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,balanced,0.7098399798075358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.01,0.19538559913635253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,balanced,0.8939680258433024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.01,0.23909120559692382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,balanced,0.24781332413355509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.01,0.2998143911361694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.01,0.2998847961425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,balanced,0.26232000192006427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.01,0.3276671886444092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.01,0.3453759908676147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.01,0.34155519008636476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,balanced,0.9094666639963785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,balanced,1.5493440628051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.01,0.357696008682251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.16676479578018188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.01,0.3651904106140137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.01,0.37112960815429685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.20126080513000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.01,0.3733952045440674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,balanced,0.2942879994710286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.08709759712219238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.01,0.4083968162536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.1390720009803772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,balanced,0.31997867425282794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.01,0.42124161720275877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.14384000301361083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,power_law_1.01,0.1667072057723999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.01,0.4357312202453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.1815616011619568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,balanced,1.212224006652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,power_law_1.01,0.1434175968170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,balanced,1.5247999827067058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.18570239543914796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.01,0.5102591991424561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,power_law_1.01,0.09056000113487243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.1808127999305725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.01,0.5448192119598388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,power_law_1.01,0.13134080171585083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.196288001537323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.01,0.6541376113891602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,balanced,0.4379146496454875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,power_law_1.01,0.1229375958442688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.01,0.6819200038909912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.18991999626159667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,power_law_1.01,0.1783360004425049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.01,0.8658432006835938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,power_law_1.01,0.18837759494781495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.2007807970046997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,balanced,0.5065439939498901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,power_law_1.01,0.20071039199829102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.01,0.9540927886962891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.2082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,power_law_1.01,0.19409279823303222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.21617279052734376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.01,1.33821439743042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,power_law_1.01,0.19913599491119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.23814399242401124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,power_law_1.01,0.2127295970916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.01,1.6509504318237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,balanced,1.3571200370788574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,power_law_1.01,0.22584319114685059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.24839680194854735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,power_law_1.01,0.23729920387268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,balanced,1.6944053967793782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.01,2.372870445251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.26156160831451414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,power_law_1.01,0.25408639907836916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.2624063968658447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.01,3.277151870727539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,balanced,0.7126186688741049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,power_law_1.01,0.2880768060684204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.3104448080062866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.01,3.977299118041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.32810239791870116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,0.393068790435791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,power_law_1.01,0.25470719337463377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.01,6.284064102172851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,0.40919041633605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,16,power_law_1.2,0.28669440746307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,balanced,0.9583360354105631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,0.5510079860687256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.19283839464187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,16,power_law_1.2,0.17824000120162964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,0.6651455879211425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.01,11.443571472167969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,power_law_1.01,0.2755903959274292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,16,power_law_1.2,0.13621120452880858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.11330560445785523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,0.8358976364135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,16,power_law_1.2,0.1931007981300354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.09427199959754944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,16,power_law_1.2,0.20555520057678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,0.9764351844787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.11645439863204957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,16,power_law_1.2,0.3219264030456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,power_law_1.01,0.2990976095199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,1.6067392349243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,16,power_law_1.2,0.32556800842285155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.12712960243225097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.01,0.34266879558563235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,balanced,1.304693301518758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,2.0422784805297853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,16,power_law_1.2,0.333951997756958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.1738111972808838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,balanced,2.2419892946879068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,16,power_law_1.2,0.33157761096954347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.1897663950920105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.01,2.375142478942871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,balanced,2.8951679865519204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,16,power_law_1.2,0.340012788772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.1821887969970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.01,0.4455423831939697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.01,3.8483009338378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,16,power_law_1.2,0.35401599407196044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.2035072088241577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.01,0.518943977355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,16,power_law_1.2,0.38172800540924073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.2033600091934204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.01,7.650054168701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,16,power_law_1.2,0.4175551891326904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.20371201038360595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.01,0.7103360176086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,16,power_law_1.2,0.3900608062744141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.21365759372711182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,balanced,1.748293399810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.21722879409790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,16,power_law_1.2,0.4198463916778564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.01,0.8550848007202149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.2479935884475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,16,power_law_1.2,0.45603199005126954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.2895103931427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,16,power_law_1.2,0.4368768215179443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.01,1.2743871688842774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.29251201152801515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,16,power_law_1.2,0.6087103843688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.28225278854370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.01,1.7944511413574218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.3506688117980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,16,power_law_1.2,0.609171199798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.01,2.9488895416259764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.364518404006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,16,power_law_1.2,0.7726016044616699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,0.3977407932281494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.01,3.197158432006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,16,power_law_1.2,0.7512447834014893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,balanced,2.088373343149821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,0.46300158500671384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,16,power_law_1.2,1.0423104286193847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,power_law_1.01,4.087200164794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,0.6169983863830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,16,power_law_1.2,1.212019157409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,0.7568704128265381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,power_law_1.01,7.932396697998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,1.0623552322387695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,16,power_law_1.2,1.6000896453857423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,1.522886371612549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,power_law_1.01,14.172154235839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,16,power_law_1.2,2.2575040817260743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,2.3345279693603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,16,power_law_1.2,3.2419071197509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,2.7787328720092774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,16,power_law_1.2,4.308544158935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,16,power_law_1.2,3.489593505859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,16,power_law_1.2,4.860492706298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,16,power_law_1.2,5.116243362426758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,balanced,4.182448069254558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,16,power_law_1.2,9.562226867675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,balanced,5.185152053833008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,16,power_law_1.2,14.388441467285157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,balanced,3.323925336201986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,16,power_law_1.2,17.569287109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,balanced,6.678533554077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,16,power_law_1.2,0.16721919775009156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,16,power_law_1.2,0.10456960201263428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,16,power_law_1.2,0.07847679853439331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,16,power_law_1.2,0.10583679676055908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,16,power_law_1.2,0.12859519720077514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,16,power_law_1.2,0.1843392014503479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,16,power_law_1.2,0.1768704056739807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,balanced,0.06357866525650024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,16,power_law_1.2,0.1902783989906311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,balanced,0.07161599894364674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,16,power_law_1.2,0.21022720336914064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,balanced,0.10378133257230122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,16,power_law_1.2,0.21445119380950928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,balanced,0.16133866707483926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,balanced,0.29764799276987713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,16,power_law_1.2,0.2180095911026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,balanced,0.3634186585744222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,balanced,0.3636853297551473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,16,power_law_1.2,0.22234880924224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,balanced,0.3507946729660034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,balanced,0.35259731610616046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,16,power_law_1.2,0.23542399406433107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,balanced,0.3534506559371948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,16,power_law_1.2,0.2703039884567261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,balanced,0.3545173406600952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,balanced,0.3566933472951253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,16,power_law_1.2,0.28574719429016116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,balanced,0.3582719961802165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,balanced,0.36300798257191974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,balanced,0.369920015335083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,16,power_law_1.2,0.28702080249786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,balanced,0.3857119878133138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,balanced,0.39652268091837567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,balanced,0.05091199775536855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,balanced,0.4082080125808716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,16,power_law_1.2,0.3010879993438721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,balanced,0.05645333230495453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,balanced,0.4222773313522339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,balanced,0.0740586668252945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,balanced,0.1111946702003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,balanced,0.17096533377965292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,balanced,0.4675573507944743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,16,power_law_1.2,0.3335616111755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,balanced,0.20407466093699136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,balanced,0.2074026664098104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.2,0.40158720016479493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,balanced,0.46511467297871906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,balanced,0.21052799622217813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,balanced,0.21089067061742148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,balanced,0.2128373384475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,balanced,0.6722453435262045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.2,0.5022592067718505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,balanced,0.2145813306172689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,balanced,0.21500267585118613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.2,0.631987190246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,balanced,0.2193066676457723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,balanced,0.590399980545044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,balanced,0.22099200884501138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.2,0.8023488044738769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,balanced,0.22744532426198324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.01,0.18005759716033937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.2,1.2893759727478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.01,0.1162559986114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,balanced,0.242959996064504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.01,0.20508160591125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,balanced,0.956384023030599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.2,1.619558334350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.01,0.12576639652252197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,balanced,0.23638399442036948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.01,0.12090239524841309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.01,0.07965440154075623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.2,1.8929536819458008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,balanced,0.26132800181706745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.01,0.1876863956451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.01,0.11952639818191528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.2,4.008505630493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,balanced,0.2696693340937297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,balanced,0.04689066608746847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.01,0.1871999979019165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,power_law_1.01,0.10960639715194702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.01,0.13290879726409913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.2,4.69422721862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,balanced,0.9646399815877279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.01,0.29132800102233886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,balanced,0.056074668963750206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.01,0.1712448000907898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,balanced,0.3199946681658427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,power_law_1.01,0.14657280445098878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,16,power_law_1.2,6.4970558166503904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.01,0.3095871925354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,balanced,0.0772266685962677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.01,0.19240959882736205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,power_law_1.01,0.07668480277061462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,balanced,0.3258879979451497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.01,0.31658239364624025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,balanced,0.1158026655515035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.01,0.18926719427108765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,power_law_1.01,0.10515199899673462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,16,power_law_1.2,10.902534484863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,balanced,0.1742666761080424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.01,0.3234240055084229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.01,0.19393279552459716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,power_law_1.01,0.13109760284423827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,balanced,0.20592532555262247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,balanced,0.43330132961273193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.01,0.31548800468444826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.01,0.1982143998146057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,power_law_1.01,0.1665536046028137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,balanced,1.2385599613189697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,16,power_law_1.2,19.877139282226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,balanced,0.20807466904322305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.01,0.34306559562683103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.01,0.20908799171447753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,power_law_1.01,0.1789888024330139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,balanced,0.2068586746851603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,balanced,0.4538293282190959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.01,0.20484480857849122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.01,0.3625920057296753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,power_law_1.01,0.18754559755325317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,balanced,0.20922666788101196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.01,0.2106112003326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.01,0.37059841156005857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,power_law_1.01,0.19495680332183837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,balanced,0.21126933892567953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.01,0.22914559841156007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,power_law_1.01,0.20606720447540283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.01,0.40862717628479006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,balanced,0.21416000525156656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,balanced,0.6893920103708903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.01,0.2443903923034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,power_law_1.01,0.21402881145477295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.01,0.44158082008361815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,balanced,0.21521600087483725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.01,0.26997759342193606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,power_law_1.01,0.21403520107269286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.01,0.42928638458251955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,balanced,0.22016533215840658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,balanced,1.6397387186686199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.01,0.2593919992446899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,power_law_1.01,0.2211519956588745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.01,0.40059518814086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,balanced,0.2237280011177063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,8,power_law_1.2,0.18002560138702392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.01,0.2899519920349121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,power_law_1.01,0.24230399131774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.01,0.5004928112030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,balanced,0.23273066679636636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,balanced,0.7954133351643881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,8,power_law_1.2,0.0970304012298584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.01,0.30078079700469973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,power_law_1.01,0.280947208404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.01,0.48708481788635255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,8,power_law_1.2,0.11330560445785523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.01,0.36957440376281736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,8,power_law_1.2,0.14252159595489503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.01,0.6088704109191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.01,0.3843519926071167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,8,power_law_1.2,0.18001279830932618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.01,0.5055615901947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.01,0.5800511837005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,8,power_law_1.2,0.2939455986022949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,power_law_1.01,0.26791679859161377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,balanced,0.23782400290171304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,8,power_law_1.2,0.31984639167785645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.01,0.66212477684021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.01,0.7450560092926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,8,power_law_1.2,0.32951040267944337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,balanced,1.0327093601226807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.01,0.8899135589599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.01,0.9175488471984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,8,power_law_1.2,0.3283263921737671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,balanced,1.8408640225728352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.01,1.076748752593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.01,1.2503168106079101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,8,power_law_1.2,0.3389951944351196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.01,1.5295040130615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,8,power_law_1.2,0.3606400012969971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.01,1.5939200401306153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,power_law_1.01,0.28652799129486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,balanced,0.25038933753967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,8,power_law_1.2,0.3899327993392944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.01,2.0135936737060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.01,2.0159423828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,8,power_law_1.2,0.3748863935470581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,8,power_law_1.2,0.4187583923339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.01,2.42663688659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.01,2.2243648529052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,8,power_law_1.2,0.449721622467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,8,power_law_1.2,0.45815038681030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.01,3.300179290771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.01,3.690342330932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,balanced,1.3476212819417317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,8,power_law_1.2,0.4552639961242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,8,power_law_1.2,0.5318784236907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.01,4.791481781005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,8,power_law_1.2,0.5230144023895263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.01,6.337260818481445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,8,power_law_1.2,0.6403264045715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,power_law_1.01,0.3074879884719849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,balanced,0.26082666714986164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.01,9.38766098022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,8,power_law_1.2,0.5824831962585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,power_law_1.01,0.35185918807983396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,8,power_law_1.2,0.7620927810668945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,balanced,0.2776266733805339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,8,power_law_1.2,1.0179264068603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,8,power_law_1.2,1.4583104133605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,8,power_law_1.2,1.6905344009399415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,balanced,3.1469974517822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,8,power_law_1.2,2.377516746520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,balanced,1.6214879353841145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,8,power_law_1.2,3.2325889587402346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,power_law_1.01,0.4586751937866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,8,power_law_1.2,4.665804672241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,balanced,0.32445865869522095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,power_law_1.01,0.5378623962402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,8,power_law_1.2,6.364940643310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,balanced,0.3733706474304199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,power_law_1.2,16.481004333496095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,power_law_1.01,0.7345791816711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,balanced,0.5195573170979818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,power_law_1.01,0.9760895729064941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,balanced,0.6052960157394409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,power_law_1.01,1.4332032203674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,power_law_1.01,1.5789504051208496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,balanced,2.517365296681722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,power_law_1.01,2.4045055389404295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,balanced,0.86135466893514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,power_law_1.01,3.3230911254882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,power_law_1.01,4.586470413208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,balanced,1.1392800013224285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,power_law_1.01,7.5229949951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,power_law_1.01,12.724179077148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,balanced,1.5746986071268718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,8,balanced,5.64243761698405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,balanced,2.0978825887044272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,balanced,4.778074582417806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,balanced,2.5306026140848794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,8,power_law_1.2,0.11712000370025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,8,power_law_1.2,0.08734719753265381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,8,power_law_1.2,0.08037760257720947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,8,power_law_1.2,0.10405759811401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,8,power_law_1.2,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,8,power_law_1.2,0.17244800329208373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,8,power_law_1.2,0.18366719484329225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,8,power_law_1.2,0.1834944009780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,8,power_law_1.2,0.18504960536956788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,balanced,4.068671862284343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,8,power_law_1.2,0.19535360336303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,8,power_law_1.2,0.2054271936416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,8,power_law_1.2,0.2133568048477173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,8,power_law_1.2,0.2158911943435669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,8,power_law_1.2,0.22514560222625732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,8,power_law_1.2,0.2533247947692871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,8,power_law_1.2,0.2822720050811768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,8,power_law_1.2,0.26793599128723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,8,power_law_1.2,0.2990015983581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,8,power_law_1.2,0.3456383943557739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,8,power_law_1.2,0.42259840965270995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,8,power_law_1.2,0.42812161445617675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,8,power_law_1.2,0.5346496105194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,8,power_law_1.2,0.722815990447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,8,power_law_1.2,0.8871423721313476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,8,power_law_1.2,1.2398336410522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,8,power_law_1.2,1.949567985534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,balanced,0.061103999614715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,8,power_law_1.2,2.352652740478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,balanced,0.07141333321730296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,8,power_law_1.2,2.8108800888061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,balanced,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,balanced,0.16204266746838888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,8,power_law_1.2,0.1162943959236145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,8,power_law_1.2,4.93699836730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,balanced,0.30403733253479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,8,power_law_1.2,0.07357439994812012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,balanced,0.3634186585744222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,8,power_law_1.2,9.98502426147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,balanced,0.36535465717315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,8,power_law_1.2,0.0770687997341156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,balanced,0.3543519973754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,8,power_law_1.2,0.11068799495697021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,balanced,0.3550879955291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,balanced,0.04870399832725525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,balanced,0.3555306593577067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,8,power_law_1.2,0.12469760179519654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,balanced,0.05684266487757365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,balanced,8.161429087320963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,balanced,0.3585760196050008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,8,power_law_1.2,0.18109439611434935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,balanced,0.36340800921122235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,balanced,0.07351999978224437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,8,power_law_1.2,0.17623039484024047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,balanced,0.3643946647644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,balanced,0.11255466938018799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,balanced,0.36972800890604657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,8,power_law_1.2,0.1970304012298584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,balanced,0.1745599905649821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,balanced,0.3773813247680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,balanced,0.2082080046335856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,8,power_law_1.2,0.20254080295562743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,balanced,0.4022453228632609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,8,power_law_1.2,0.20908799171447753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,balanced,0.21049600839614868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,balanced,0.4085386594136556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,8,power_law_1.2,0.21404800415039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,balanced,0.21410133441289267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,balanced,0.215664009253184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,8,power_law_1.2,0.23276159763336182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,balanced,0.49210135142008465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,balanced,0.21714133024215698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,8,power_law_1.2,0.24119679927825927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,balanced,0.4482719898223877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,8,power_law_1.2,0.2607935905456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,balanced,0.21766932805379233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,8,power_law_1.2,0.29107840061187745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,balanced,0.22107734282811484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,balanced,0.521226684252421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,balanced,0.22061866521835327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,balanced,0.22539732853571573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,balanced,0.514842669169108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,8,power_law_1.2,0.2730304002761841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,balanced,0.23525333404541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,balanced,0.25149865945180255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,balanced,0.6887786388397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,balanced,0.24809066454569498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,8,power_law_1.2,0.3113343954086304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,balanced,0.292794664700826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,balanced,0.6779253482818604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,balanced,0.29290133714675903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,8,power_law_1.2,0.3460095882415771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,balanced,0.3785173495610555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,8,power_law_1.2,0.3930943965911865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.01,0.10058239698410035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,balanced,1.0402666727701824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,balanced,0.052330667773882546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,balanced,0.3737599849700928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.01,0.11991679668426514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,8,power_law_1.2,0.4937407970428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,balanced,0.060991997520128884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.01,0.09397760033607483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,balanced,0.07924266656239827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,8,power_law_1.2,0.640121603012085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.01,0.14767359495162963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,balanced,0.49162666002909344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,balanced,0.11753066380818684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.01,0.18284159898757935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,balanced,1.1622933546702068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,8,power_law_1.2,0.7906943798065186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,balanced,0.1718719998995463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.01,0.29076480865478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,balanced,0.2080906629562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,balanced,0.5460106531778971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.01,0.3063231945037842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,8,power_law_1.2,1.0714943885803223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.01,0.3151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,balanced,0.21050133307774863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.01,0.3166975975036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,8,power_law_1.2,1.4573887825012206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,balanced,0.21386132637659708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.01,0.31763200759887694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,8,power_law_1.2,2.0763008117675783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,balanced,0.21702400843302408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,balanced,0.8150986830393473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.01,0.3420799970626831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,balanced,1.4821707407633464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,8,power_law_1.2,3.366495895385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,balanced,0.21751999855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,balanced,0.22203733523686728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.01,0.35928959846496583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,8,power_law_1.2,4.212998580932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,balanced,0.22551999489466348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.01,0.362009596824646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,balanced,0.2288693388303121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,8,power_law_1.2,5.024812698364258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,balanced,0.9582826296488444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.01,0.37500159740447997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,balanced,0.23685866594314575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.01,0.07192959785461425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.01,0.4019904136657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,balanced,0.24952532847722372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,8,power_law_1.2,11.351840209960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.01,0.4243584156036377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.01,0.08595200181007386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.01,0.41794562339782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.01,0.06835200190544129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,balanced,1.9164533615112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.01,0.48772478103637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.01,0.10408320426940917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,8,power_law_1.2,20.66460723876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.01,0.5045567989349365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.01,0.12334719896316529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,balanced,0.25756265719731647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,balanced,1.2945013046264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.01,0.168230402469635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.01,0.5477824211120605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.01,0.17864320278167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.01,0.6458111763000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.01,0.18243199586868286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.01,0.7713215827941895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.01,0.18789759874343873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.01,0.9057279586791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,balanced,0.2723466753959656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.01,0.19411200284957886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.01,0.20203518867492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.01,1.2433343887329102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.01,0.20817279815673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.01,0.2092672109603882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.01,1.5214655876159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,balanced,2.2851413091023765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,balanced,1.6983946164449055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.01,0.21996159553527833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.01,2.4722944259643556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.01,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,balanced,0.30421332518259686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.01,2.6745344161987306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.01,0.24291200637817384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.01,0.26232318878173827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,balanced,0.3449813524881999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.01,3.355699157714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.01,0.29674880504608153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.01,0.3119488000869751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.01,4.987769699096679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.01,0.38593919277191163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.01,0.45299201011657714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,balanced,0.42581868171691895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.01,9.38086395263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.01,0.5297344207763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.01,0.671014404296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,balanced,2.043951988220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,balanced,0.4981706539789836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.01,0.9079360008239746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.01,1.1023039817810059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.01,1.5799872398376464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.01,2.042732810974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.01,2.674380874633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,balanced,3.6705652872721353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,balanced,0.7217439810434977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.01,4.3780864715576175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.01,8.039590454101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,balanced,0.8745333353678385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,balanced,1.2404266993204753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,balanced,3.2068052291870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,balanced,1.6273493766784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,4,power_law_1.2,0.11187200546264649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,4,power_law_1.2,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,4,power_law_1.2,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,4,power_law_1.2,0.13875839710235596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,4,power_law_1.2,0.17414400577545167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,power_law_1.01,0.08486400246620178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,4,power_law_1.2,0.27013120651245115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,balanced,2.28163735071818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,power_law_1.01,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,4,power_law_1.2,0.2966912031173706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,power_law_1.01,0.07198079824447631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,4,power_law_1.2,0.30188798904418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,power_law_1.01,0.10087679624557495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,4,power_law_1.2,0.32728960514068606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,power_law_1.01,0.12615679502487182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,4,power_law_1.2,0.3404223918914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,power_law_1.01,0.18293119668960572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,4,power_law_1.2,0.3565439939498901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,power_law_1.01,0.18535679578781128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,4,power_law_1.2,0.3734015941619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,power_law_1.01,0.19440000057220458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,4,power_law_1.2,0.36884479522705077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,balanced,3.0342238744099936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,power_law_1.01,0.18958719968795776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,4,power_law_1.2,0.3962111949920654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,balanced,6.873658498128255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,power_law_1.01,0.20728321075439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,4,power_law_1.2,0.4316671848297119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,power_law_1.01,0.2145983934402466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,4,power_law_1.2,0.42668800354003905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,power_law_1.01,0.22083840370178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,4,power_law_1.2,0.44671998023986814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,power_law_1.01,0.24131839275360106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,4,power_law_1.2,0.539788818359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,power_law_1.01,0.2583679914474487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,4,power_law_1.2,0.5088575839996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,power_law_1.01,0.280403208732605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,4,power_law_1.2,0.6271488189697265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,4,power_law_1.2,0.6527359962463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,balanced,3.6885334650675454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,balanced,6.24667231241862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,4,power_law_1.2,0.876467227935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,power_law_1.01,0.28086400032043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,4,power_law_1.2,0.9813247680664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,4,power_law_1.2,1.3085375785827638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,power_law_1.01,0.3147968053817749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,4,power_law_1.2,1.8167552947998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,4,power_law_1.2,2.326483154296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,power_law_1.01,0.3524735927581787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,4,power_law_1.2,3.2871681213378907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,power_law_1.01,0.41149439811706545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,4,power_law_1.2,3.45546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,power_law_1.01,0.5079616069793701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,4,power_law_1.2,6.319558334350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,power_law_1.01,0.5987135887145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,power_law_1.01,0.889798355102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,4,power_law_1.2,11.712921905517579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,balanced,5.874586741129558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,power_law_1.01,1.0381248474121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,power_law_1.01,1.5297856330871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,power_law_1.01,1.9376256942749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,power_law_1.01,2.913894462585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,power_law_1.01,4.1171520233154295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,power_law_1.01,4.645119857788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,4,power_law_1.2,0.076665598154068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,power_law_1.01,7.910214233398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,4,power_law_1.2,0.06207360029220581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,4,power_law_1.2,0.07388160228729249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,power_law_1.01,15.4246337890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,4,power_law_1.2,0.0919871985912323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,4,power_law_1.2,0.10119040012359619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,4,power_law_1.2,0.17278079986572265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,4,power_law_1.2,0.17573120594024658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,4,power_law_1.2,0.18865280151367186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,4,power_law_1.2,0.19288320541381837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,4,power_law_1.2,0.20127999782562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,4,power_law_1.2,0.20500481128692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,4,power_law_1.2,0.21608319282531738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,4,power_law_1.2,0.22406399250030518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,4,power_law_1.2,0.22160639762878417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,4,power_law_1.2,0.24960000514984132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,4,power_law_1.2,0.2703808069229126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,4,power_law_1.2,0.27153921127319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,4,power_law_1.2,0.3100287914276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,4,power_law_1.2,0.3214272022247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,4,power_law_1.2,0.40595197677612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,4,power_law_1.2,0.4505472183227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,4,power_law_1.2,0.08506240248680115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,balanced,11.780879974365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,4,power_law_1.2,0.5929728031158448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,4,power_law_1.2,0.7329279899597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,4,power_law_1.2,0.06684799790382386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,4,power_law_1.2,0.97325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,4,power_law_1.2,0.07273600101470948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,4,power_law_1.2,1.112825584411621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,4,power_law_1.2,0.09262719750404358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,4,power_law_1.2,2.0163007736206056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,4,power_law_1.2,0.11011199951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,balanced,0.062218666076660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,4,power_law_1.2,2.3753408432006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,4,power_law_1.2,0.17905919551849364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,4,power_law_1.2,3.0413951873779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,balanced,0.07326399783293407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,4,power_law_1.2,0.18178559541702272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,balanced,0.10398399829864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,4,power_law_1.2,4.958380889892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,4,power_law_1.2,0.18760960102081298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,balanced,0.1644159952799479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,4,power_law_1.2,11.664588928222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,balanced,0.30560533205668133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,4,power_law_1.2,0.19662079811096192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,balanced,0.37519999345143634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,4,power_law_1.2,0.20873599052429198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,balanced,0.3708053429921468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,4,power_law_1.2,0.2188416004180908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,balanced,0.35979731877644855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,balanced,0.36443201700846356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,4,power_law_1.2,0.23272960186004638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,balanced,0.36477867762247723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,4,power_law_1.2,0.24897279739379882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,balanced,0.3676746686299642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,4,power_law_1.2,0.258624005317688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,balanced,0.37405868371327716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,4,power_law_1.2,0.28784000873565674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,balanced,0.3733493487040202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,balanced,0.382426659266154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,balanced,0.3943839867909749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,4,power_law_1.2,0.28540160655975344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,balanced,0.4180320103963216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,balanced,0.4352426528930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,4,power_law_1.2,0.308735990524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,balanced,0.495525320370992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,balanced,0.4931573470433553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,4,power_law_1.2,0.3539072036743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,balanced,0.05133866767088572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,balanced,0.6184373299280802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,balanced,0.05835199852784475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,4,power_law_1.2,0.4283775806427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,balanced,0.07645866771539052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,balanced,0.619375983874003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,balanced,0.11993599931399028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,4,power_law_1.2,0.5542463779449462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,balanced,0.18079467614491782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,balanced,0.21318932374318442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,balanced,0.7771360079447428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,4,power_law_1.2,0.6570112228393554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,balanced,0.21997332572937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,balanced,0.2212160031000773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,balanced,0.22362132867177328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,4,power_law_1.2,0.8801088333129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,balanced,0.22535999615987143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,balanced,0.882042646408081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,4,power_law_1.2,1.2416959762573243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,balanced,0.22889065742492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,balanced,0.23362133900324503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,4,power_law_1.2,1.7633407592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,balanced,0.23609066009521484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,4,power_law_1.2,2.096928024291992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,balanced,0.2450773318608602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,balanced,1.3603092829386394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,balanced,0.25711466868718463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,4,power_law_1.2,3.2019840240478517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,balanced,0.2624586621920268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,balanced,0.27618666489919025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,4,power_law_1.2,4.300979232788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,balanced,0.34946131706237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,balanced,0.06567466755708058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,4,power_law_1.2,5.724972915649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,balanced,0.33828266461690265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,balanced,1.5540693600972493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,balanced,0.07177066802978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,balanced,0.423093318939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,balanced,0.08994666735331218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,4,power_law_1.2,9.511417388916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,balanced,0.12771733601888022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,balanced,0.19470399618148804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,balanced,0.45691200097401935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,balanced,0.22895467281341553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,4,power_law_1.2,21.129696655273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,balanced,0.23366934061050415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,balanced,0.6246453523635864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,balanced,0.23690134286880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,balanced,2.4287947018941245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,balanced,0.23966399828592935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,balanced,0.2446133295694987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,balanced,0.7429280281066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.01,0.07578240036964416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,balanced,0.25034133593241376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.01,0.08967040181159973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,balanced,0.2579466700553894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,balanced,0.2651840051015218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.01,0.09029759764671326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,balanced,1.1331413586934407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,balanced,0.27703466018040973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.01,0.1350335955619812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,balanced,0.29307732979456586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.01,0.1782912015914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,balanced,2.906592051188151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.01,0.29219200611114504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.01,0.3072959899902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,balanced,1.3788587252298992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.01,0.31067519187927245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,balanced,0.3089440067609151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.01,0.059001600742340087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.01,0.32334079742431643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.01,0.06769919991493226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.01,0.32071681022644044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.01,0.06744319796562195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.01,0.35032958984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.01,0.09696000218391418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,balanced,2.0589866638183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,balanced,0.3452800114949544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.01,0.3567552089691162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.01,0.12284799814224243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.01,0.3742784023284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.01,0.17738879919052125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,balanced,3.291221300760905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.01,0.3879807949066162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.01,0.19332480430603027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.01,0.39836161136627196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.01,0.19596799612045288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.01,0.42955517768859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.01,0.19674240350723265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,balanced,0.42926931381225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.01,0.4531839847564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.01,0.20364160537719728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.01,0.503385591506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,balanced,0.49139734109242755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,balanced,2.54639466603597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.01,0.22311680316925048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.01,0.5539648056030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.01,0.22527360916137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.01,0.6360703945159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.01,0.2314687967300415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.01,0.6612351894378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,balanced,0.6300479968388876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.01,0.24315519332885743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.01,0.8222528457641601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.01,0.2552000045776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.01,1.0906304359436034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.01,0.26777598857879636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,balanced,0.7601706981658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.01,0.28999040126800535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.01,1.4433535575866698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.01,0.33809919357299806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,balanced,1.1312106450398762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.01,1.9138431549072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,balanced,2.972874641418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.01,0.3546816110610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,balanced,5.356149037679036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.01,2.710374450683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.01,0.44715518951416017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,balanced,1.3946986198425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.01,0.4897024154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.01,3.0221120834350588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.01,0.6320640087127686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.01,3.9412288665771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,power_law_1.01,0.07626240253448487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.01,0.8581503868103028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,power_law_1.01,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.01,1.2130240440368651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,balanced,2.018986701965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.01,5.80882568359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,power_law_1.01,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.01,1.4497152328491212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,power_law_1.01,0.10993280410766601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,power_law_1.01,0.13263360261917115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.01,2.0986047744750977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.01,11.675692749023437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,power_law_1.01,0.19085439443588256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,2,power_law_1.2,0.07570559978485107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,power_law_1.01,0.19790079593658447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.01,2.682579231262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,balanced,2.6353333791097007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,power_law_1.01,0.21043839454650878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,2,power_law_1.2,0.06995840072631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,power_law_1.01,0.21050240993499755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.01,3.3097023010253905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,2,power_law_1.2,0.07890560030937195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,power_law_1.01,0.22807040214538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,power_law_1.01,0.24332799911499023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,2,power_law_1.2,0.12030719518661499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.01,5.793273544311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,balanced,4.787391980489095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,power_law_1.01,0.25783040523529055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,2,power_law_1.2,0.1537343978881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,power_law_1.01,0.27166080474853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,2,power_law_1.2,0.2908096075057983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.01,11.047245025634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,power_law_1.01,0.2925695896148682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,balanced,3.772298812866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,2,power_law_1.2,0.3101248025894165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,power_law_1.01,0.32454400062561034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,2,power_law_1.2,0.3197887897491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,2,power_law_1.2,0.3282304048538208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,power_law_1.01,0.3309119939804077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,2,power_law_1.2,0.3284800052642822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,2,power_law_1.2,0.35640320777893064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,2,power_law_1.2,0.3698944091796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,power_law_1.01,0.3739327907562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,2,power_law_1.2,0.3799168109893799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,2,power_law_1.2,0.40037121772766116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,balanced,4.99945068359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,2,power_law_1.2,0.42232961654663087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,power_law_1.01,0.4678783893585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,2,power_law_1.2,0.438156795501709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,power_law_1.01,0.5470208168029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,2,power_law_1.2,0.4503488063812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,balanced,10.2455202738444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,2,power_law_1.2,0.518342399597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,power_law_1.01,0.6910016059875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,2,power_law_1.2,0.5545663833618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,power_law_1.01,0.8517760276794434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,power_law_1.01,1.1415231704711915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,2,power_law_1.2,0.6658880233764648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,power_law_1.01,1.5104960441589355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,2,power_law_1.2,0.7479167938232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,power_law_1.01,2.0314048767089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,2,power_law_1.2,0.9300224304199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,balanced,6.080319722493489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,power_law_1.01,2.740345573425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,2,power_law_1.2,1.182271957397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,power_law_1.01,4.131935882568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,2,power_law_1.2,1.492140769958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,power_law_1.01,5.406777572631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,2,power_law_1.2,2.001369667053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,power_law_1.01,6.829670715332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,2,power_law_1.2,3.054284858703613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,power_law_1.01,10.716915130615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,2,power_law_1.2,3.6113727569580076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,balanced,9.497519810994467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,2,power_law_1.2,4.5037696838378904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,power_law_1.01,20.80446014404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,2,power_law_1.2,7.4494140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,2,power_law_1.2,12.972262573242187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,balanced,9.863930384318033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,2,power_law_1.2,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,2,power_law_1.2,0.05728639960289002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,2,power_law_1.2,0.06746240258216858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,2,power_law_1.2,0.09364479780197144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,2,power_law_1.2,0.11397759914398194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,2,power_law_1.2,0.17864320278167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,2,power_law_1.2,0.18735359907150267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,2,power_law_1.2,0.19127680063247682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,2,power_law_1.2,0.20341119766235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,2,power_law_1.2,0.21552639007568358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,2,power_law_1.2,0.22291839122772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,2,power_law_1.2,0.23442559242248534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,2,power_law_1.2,0.2445375919342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,2,power_law_1.2,0.24499199390411378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,2,power_law_1.2,0.2627968072891235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,2,power_law_1.2,0.27968640327453614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,2,power_law_1.2,0.29585919380187986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,2,power_law_1.2,0.3428544044494629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,2,power_law_1.2,0.37015039920806886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,2,power_law_1.2,0.43880319595336914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,2,power_law_1.2,0.5082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,2,power_law_1.2,0.6719615936279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,2,power_law_1.2,0.8891008377075196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,balanced,19.51795196533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,2,power_law_1.2,1.2569600105285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,2,power_law_1.2,1.5801216125488282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,2,power_law_1.2,2.268044853210449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,2,power_law_1.2,3.0414976119995116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,2,power_law_1.2,3.7462848663330077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,2,power_law_1.2,5.680160140991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,2,power_law_1.2,10.998937225341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,2,power_law_1.2,0.07603840231895446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,2,power_law_1.2,0.07120000123977661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,2,power_law_1.2,0.0800704002380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,2,power_law_1.2,0.10366719961166382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,balanced,0.06750933329264323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,2,power_law_1.2,0.12268799543380737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,balanced,0.08233066896597545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,2,power_law_1.2,0.18448640108108522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,balanced,0.11243200302124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,2,power_law_1.2,0.2021183967590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,balanced,0.1797013282775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,balanced,0.31245332956314087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,2,power_law_1.2,0.21249918937683104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,balanced,0.37832534313201904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,2,power_law_1.2,0.22223360538482667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,balanced,0.38338665167490643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,2,power_law_1.2,0.22967679500579835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,balanced,0.3835039933522542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,balanced,0.38763201236724854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,2,power_law_1.2,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,balanced,0.39266665776570636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,2,power_law_1.2,0.267577600479126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,balanced,0.39662400881449383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,2,power_law_1.2,0.2827136039733887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,balanced,0.40594132741292316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,balanced,0.4111040035883586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,2,power_law_1.2,0.2974208116531372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,balanced,0.4220053354899089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,balanced,0.055770665407180786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,2,power_law_1.2,0.3233151912689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,balanced,0.06582933167616527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,balanced,0.4359946648279826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,balanced,0.08530132969220479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,balanced,0.4498080015182495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,balanced,0.13182933131853738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,2,power_law_1.2,0.33305599689483645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,balanced,0.20931732654571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,balanced,0.47042131423950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,balanced,0.24551467100779215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,balanced,0.5841066837310791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,balanced,0.25272534290949505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,2,power_law_1.2,0.39497599601745603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,balanced,0.2507573366165161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,balanced,0.5662453174591064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,balanced,0.25404266516367596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,balanced,0.25756800174713135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,balanced,0.7246026992797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,2,power_law_1.2,0.4653312206268311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,balanced,0.2615306576093038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,balanced,0.26548266410827637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,2,power_law_1.2,0.5472959995269775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,balanced,0.8345440228780111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,balanced,0.27269333600997925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,balanced,0.28466665744781494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,2,power_law_1.2,0.7488128185272217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,balanced,0.3012053370475769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,balanced,1.1894346872965496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,2,power_law_1.2,0.9033791542053222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,balanced,0.3204853336016337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,balanced,0.09503466884295146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.0662335991859436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,2,power_law_1.2,1.238259220123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,balanced,0.341050664583842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,balanced,0.10249066352844238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.07180160284042358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.05255680084228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,balanced,1.3285919825236003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,2,power_law_1.2,1.6184000015258788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,balanced,0.4668906529744466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,balanced,0.12343999743461609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.09281280040740966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.059513598680496216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,2,power_law_1.2,2.2327871322631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,balanced,0.16966933012008667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,balanced,0.434986670811971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.1378559947013855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.07303680181503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,balanced,0.24038932720820108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.18477439880371094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,2,power_law_1.2,3.1328895568847654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,balanced,0.5350506703058878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,balanced,0.2810773253440857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,balanced,2.1925759315490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.10684800148010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.30001919269561766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,balanced,0.2898719906806946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.13400319814682007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,2,power_law_1.2,4.269247817993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.31794559955596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,balanced,0.6196959813435873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,balanced,0.2943039933840434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.20607359409332277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.3264512062072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,2,power_law_1.2,5.948966217041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,balanced,0.30246400833129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.20940799713134767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.3386751890182495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.21804161071777345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,balanced,0.30910933017730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,balanced,0.9782293637593588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,balanced,2.5654613176981607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,2,power_law_1.2,7.231385803222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.34517760276794435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.23677439689636232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,balanced,0.31938133637110394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,balanced,0.3344159921010335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.35190401077270506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.23909120559692382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,balanced,0.34770667552948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.3784064054489136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.25880959033966067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,2,power_law_1.2,12.398143768310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,balanced,1.1568000316619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.2746495962142944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.3896127939224243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,balanced,0.37481598059336346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.28885760307312014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.40327677726745603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,balanced,0.4078559875488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.2898175954818726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.4525951862335205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,2,power_law_1.2,22.427763366699217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.3219007968902588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,balanced,4.024245262145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,balanced,1.782090663909912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.464844799041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.4880256175994873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.37093119621276854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.5843840122222901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.01,0.4531775951385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,balanced,0.4532586733500163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.5895743846893311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,0.4747456073760986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.7197055816650391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,0.5825920104980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,balanced,2.2275892893473306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.878604793548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.01,1.150822353363037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,0.6926400184631347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.01,1.538924789428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,0.9076479911804199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,balanced,0.5133493343989054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.01,2.116511917114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,1.180121612548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,balanced,4.613199869791667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.01,2.6159168243408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,1.666771125793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.01,3.9507007598876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,balanced,3.30841064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,2.1691776275634767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.01,4.959584045410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,3.2093952178955076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,balanced,0.6675360202789307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,4.132371139526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.01,6.09283218383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,balanced,0.7857600053151449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.01,5.198835372924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,balanced,1.042629321416219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.01,9.121804809570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.01,8.22875518798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,balanced,1.2847999731699626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,balanced,5.669866561889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.01,17.850918579101563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,balanced,4.050575892130534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.01,16.41651153564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,balanced,1.9549439748128254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,power_law_1.01,0.08416640162467956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,power_law_1.01,0.09566720128059387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,balanced,2.4297919273376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,power_law_1.01,0.10746879577636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.06459519863128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,power_law_1.01,0.13787519931793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.06880000233650208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,power_law_1.01,0.16535040140151977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,balanced,3.559370676676432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.09048960208892823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,power_law_1.01,0.23343360424041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.12725759744644166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,power_law_1.01,0.2523776054382324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,balanced,4.880256017049153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.16984319686889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,power_law_1.01,0.26375041007995603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,balanced,4.689093271891276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.28970239162445066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,power_law_1.01,0.27489919662475587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.31296000480651853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,power_law_1.01,0.28757760524749754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,balanced,8.594581604003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.3321791887283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.3464960098266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,power_law_1.01,0.31106560230255126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.36090240478515623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,power_law_1.01,0.3370176076889038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.36417279243469236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,power_law_1.01,0.35715839862823484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,balanced,6.736154556274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.3932096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,power_law_1.01,0.4034560203552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.4152703762054443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,power_law_1.01,0.45790719985961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.44045438766479494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.45102720260620116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,power_law_1.01,0.4858816146850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.4701375961303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,balanced,7.747392018636067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.49320321083068847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.596608018875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,power_law_1.01,0.5504447937011718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,balanced,8.948298772176107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.6032320022583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.7337855815887451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,power_law_1.01,0.6752575874328614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.8893759727478028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.01,0.8090944290161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,1,power_law_1.2,1.1842047691345214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.01,1.087615966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,1,power_law_1.2,1.5821439743041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.01,1.3505472183227538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,1,power_law_1.2,2.189414405822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.01,1.875142478942871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,1,power_law_1.2,2.710419273376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.01,2.421855926513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,1,power_law_1.2,3.997555160522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,balanced,10.967503865559896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.01,3.4953536987304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,1,power_law_1.2,5.080307388305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.01,4.5759742736816404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,1,power_law_1.2,6.353542327880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.01,6.714227294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,1,power_law_1.2,9.134349060058593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.01,8.8652099609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,balanced,17.126383463541668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.01,10.987929534912109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,1,power_law_1.2,17.721133422851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,power_law_1.01,17.405010986328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,power_law_1.01,34.71707458496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,balanced,17.439594268798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,balanced,16.138987223307293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.05380480289459229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.07058560252189636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.10042239427566528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.12357759475708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.19630719423294068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.21660161018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.22927360534667968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.2386176109313965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.24766080379486083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.2596224069595337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.2805056095123291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.29402239322662355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.2980544090270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.3178368091583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,balanced,0.08794132868448894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.33646719455718993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.374726390838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,balanced,0.08734933535257976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,balanced,34.96131134033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,1,power_law_1.2,0.44879999160766604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,balanced,0.10251200199127197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,1,power_law_1.2,0.08479999899864196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,0.48076162338256834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,balanced,0.1564533313115438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,balanced,0.26628265778223675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,1,power_law_1.2,0.09630079865455628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,0.5918015956878662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,balanced,0.5002986590067545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,1,power_law_1.2,0.10609920024871826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,0.6937024116516113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,balanced,0.7273866335550944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,1,power_law_1.2,0.13162239789962768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,balanced,0.7261333465576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,0.9298687934875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,1,power_law_1.2,0.1564288020133972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,balanced,0.7262293497721354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,1,power_law_1.2,0.23159680366516114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,1.1919103622436524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,balanced,0.7255199750264486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,1,power_law_1.2,0.25824000835418703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,1.7027263641357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,1,power_law_1.2,0.26657919883728026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,balanced,0.7247786521911621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,1,power_law_1.2,0.284172797203064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,balanced,0.7215253512064616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,2.2120384216308593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,1,power_law_1.2,0.3023423910140991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,balanced,0.7232480049133301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,3.2906238555908205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,1,power_law_1.2,0.31923201084136965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,balanced,0.7277759710947672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,1,power_law_1.2,0.3425152063369751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,4.189324951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,balanced,0.7351146539052328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,1,power_law_1.2,0.37034239768981936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,balanced,0.7376586596171061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,1,power_law_1.2,5.298348617553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,1,power_law_1.2,0.4130112171173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,1,power_law_1.2,0.4642752170562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,balanced,0.7463573614756266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,1,power_law_1.2,8.142675018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,balanced,0.7574986616770426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,balanced,0.7906986872355143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,1,power_law_1.2,0.49529600143432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,1,power_law_1.2,16.01197509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,balanced,0.8148799737294515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,1,power_law_1.2,0.5564735889434814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,balanced,0.8391786416371664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,balanced,0.8806560039520264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,1,power_law_1.2,0.6944064140319824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.2,0.8193535804748535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.2,1.103110408782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,balanced,0.9442666371663412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.2,1.3734463691711425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.2,1.9043136596679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.2,2.4249664306640626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,balanced,1.020026683807373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.2,3.5037952423095704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.2,4.599494552612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.2,6.755046081542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,balanced,1.159663995107015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.2,8.89715805053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.2,11.083634948730468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,balanced,0.06088533500830332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,1,power_law_1.2,17.60968933105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,balanced,1.3274346987406414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,balanced,0.06234666705131531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,balanced,0.07258666555086772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,balanced,0.10390399893124898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,1,power_law_1.2,34.9318603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,balanced,0.16241066654523215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,balanced,0.275706668694814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,balanced,0.3912959893544515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.01,0.2882368087768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,balanced,0.3925653298695882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.17521920204162597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,balanced,0.39188798268636066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.01,0.5010816097259522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,balanced,0.06063466767470042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,balanced,0.39376533031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,balanced,1.6894933382670085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.01,0.7160064220428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.01,0.2731712102890015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,balanced,0.05786666770776113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,balanced,0.40032533804575604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.01,0.17768319845199584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,balanced,0.07679999868075053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.01,0.3818176031112671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,balanced,0.40275200208028156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.01,0.2549567937850952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,balanced,0.11385599772135417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.01,0.40023040771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,balanced,0.40299733479817706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.01,0.1159551978111267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,balanced,0.18112534284591675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.01,0.44766721725463865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,balanced,0.4041759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.01,0.17030400037765503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.01,0.5299456119537354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,balanced,0.27024000883102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,balanced,0.4129600127538045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.01,0.5524928092956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,balanced,0.38490132490793866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.01,0.22554240226745606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,balanced,0.417738676071167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.01,0.5595263957977294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,balanced,0.38628268241882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,balanced,0.3877013524373372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,balanced,0.42662398020426434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.01,0.5858560085296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.01,0.2663039922714233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,balanced,0.3887893358866374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.01,0.6142335891723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,balanced,2.1651253700256348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,balanced,0.4428639809290568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,balanced,0.3914773464202881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.01,0.5929344177246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.01,0.29144959449768065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,balanced,0.39470934867858887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,balanced,0.4599999984105428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.01,0.6547520160675049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,balanced,0.397216002146403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.01,0.6384640216827393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.01,0.298304009437561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,balanced,0.4881440003712972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.01,0.6746367931365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,balanced,0.40053868293762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.01,0.3048831939697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.01,0.6983039855957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,balanced,0.41007999579111737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,balanced,0.5173813501993815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.01,0.8129152297973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.01,0.2996543884277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,balanced,0.4115519920984904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.01,0.746943998336792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,balanced,0.4224693377812703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.01,0.3433216094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,balanced,0.571674664815267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.01,0.8947392463684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,balanced,0.44225601355234784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.01,0.34552960395812987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.01,0.9893055915832519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.01,0.35662720203399656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.01,1.164076805114746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,balanced,0.636303981145223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.01,1.1380415916442872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.01,0.35905280113220217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.01,1.4506879806518556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.01,0.3805376052856445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,balanced,0.4609813292821248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.01,0.3863231897354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.01,1.6630144119262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,balanced,0.7364853223164877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.01,0.43018879890441897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,balanced,3.0953919092814126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.01,2.3090944290161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,0.4561024188995361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.01,2.639756774902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,0.5393599987030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.01,3.4317569732666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,balanced,0.8840800126393636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,0.5709824085235595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,0.6990335941314697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.01,5.062649536132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,0.7327360153198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,balanced,0.49420801798502606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,0.9529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,power_law_1.01,0.1851456046104431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.01,9.861446380615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,1.1188608169555665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,power_law_1.01,0.27691519260406494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,balanced,0.5286453167597452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,1.5862848281860351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,balanced,1.1028640270233154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,power_law_1.01,0.38572158813476565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,1.9818239212036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,power_law_1.01,0.13006720542907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,balanced,0.5957440137863159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.01,2.5061504364013674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,power_law_1.01,0.17674880027770995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,power_law_1.01,0.22456960678100585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.01,3.906969451904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,power_law_1.01,0.2531519889831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.01,8.118624114990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,power_law_1.01,0.30576000213623045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,balanced,1.439743995666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,power_law_1.01,0.2996992111206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,balanced,0.6785386403401693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,power_law_1.01,0.33701119422912595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,16,power_law_1.2,0.26166400909423826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,power_law_1.01,0.3173759937286377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,power_law_1.01,0.3430720090866089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,16,power_law_1.2,0.5013055801391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,balanced,0.8160479863484701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,power_law_1.01,0.3354880094528198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,16,power_law_1.2,0.3705471992492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,power_law_1.01,0.3643712043762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,16,power_law_1.2,0.1909183979034424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,power_law_1.01,0.4009856224060059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,16,power_law_1.2,0.2660736083984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,power_law_1.01,0.4147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,balanced,1.0920906861623128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,power_law_1.01,0.45135998725891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,16,power_law_1.2,0.3585088014602661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,balanced,1.7993067105611165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,power_law_1.01,0.5219456195831299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,16,power_law_1.2,0.37776000499725343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,balanced,5.83189328511556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,16,power_law_1.2,0.5458176136016846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.01,0.5417727947235107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,16,power_law_1.2,0.5500095844268799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,16,power_law_1.2,0.5263872146606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,balanced,1.3693226178487141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.01,0.5665023803710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,16,power_law_1.2,0.5597184181213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.01,0.6485311985015869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.01,0.8428223609924317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,16,power_law_1.2,0.5782591819763183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,16,power_law_1.2,0.5727424144744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.01,0.9196415901184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,16,power_law_1.2,0.6392831802368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.01,1.283084774017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,16,power_law_1.2,0.6485119819641113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.01,1.5924032211303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,balanced,1.875823974609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,16,power_law_1.2,0.614905595779419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,balanced,2.6605920791625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.01,2.293049621582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,16,power_law_1.2,0.6748223781585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.01,2.973311996459961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,16,power_law_1.2,0.8134847640991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,power_law_1.01,3.5843135833740236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,16,power_law_1.2,0.9155712127685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,power_law_1.01,5.586022567749024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,16,power_law_1.2,1.0805631637573243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,16,power_law_1.2,1.1434623718261718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,power_law_1.01,11.186860656738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,16,power_law_1.2,1.4346048355102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,balanced,2.3763465881347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,16,power_law_1.2,1.3668416023254395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.17463680505752563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,16,power_law_1.2,1.810380744934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,16,power_law_1.2,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,16,power_law_1.2,1.9397119522094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,16,power_law_1.2,0.16143360137939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,16,power_law_1.2,2.5392831802368163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,16,power_law_1.2,0.11989120244979859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,16,power_law_1.2,0.15783679485321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,16,power_law_1.2,3.3136001586914063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,16,power_law_1.2,0.20339839458465575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,16,power_law_1.2,4.683097457885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,16,power_law_1.2,0.22403841018676757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,16,power_law_1.2,0.31020159721374513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,16,power_law_1.2,7.27886734008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,16,power_law_1.2,0.2834815979003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,16,power_law_1.2,0.29268479347229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,16,power_law_1.2,14.695808410644531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,16,power_law_1.2,0.33223040103912355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,balanced,3.6727094650268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,16,power_law_1.2,0.3297919988632202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,16,power_law_1.2,0.3433216094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,16,power_law_1.2,0.34961280822753904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,16,power_law_1.2,0.3750335931777954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,16,power_law_1.2,0.40931200981140137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,16,power_law_1.2,0.3975359916687012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,balanced,5.094906806945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,16,power_law_1.2,0.4489471912384033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,0.49346561431884767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,0.5760511875152587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,0.6560383796691894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,0.8200192451477051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,0.856499195098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,1.0817279815673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,1.4307392120361329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,1.9018367767333983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,2.5519744873046877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,16,power_law_1.2,3.1079679489135743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,16,power_law_1.2,4.335782241821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,16,power_law_1.2,10.181798553466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,balanced,0.06957866748174031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,balanced,7.205514907836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,balanced,0.07256000240643819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,balanced,0.0990559955437978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,balanced,0.15647466977437338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,balanced,0.2689653237660726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,16,power_law_1.2,0.1657920002937317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,balanced,0.4999093214670817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,16,power_law_1.2,0.2772864103317261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,balanced,0.7252853711446127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,16,power_law_1.2,0.2512128114700317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,balanced,0.728874683380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,balanced,0.7254079977671305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,16,power_law_1.2,0.10732159614562989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,balanced,0.7311999797821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,16,power_law_1.2,0.16939519643783568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,balanced,0.7225066820780436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,16,power_law_1.2,0.19363839626312257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,balanced,0.7278186480204264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,balanced,0.7263573010762533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,16,power_law_1.2,0.22069759368896485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,balanced,0.7310187021891276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,16,power_law_1.2,0.30164480209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,balanced,0.7410133679707845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,16,power_law_1.2,0.303219199180603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,balanced,0.7444372971852621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,balanced,0.053173333406448364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,balanced,0.7546453475952148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,16,power_law_1.2,0.31254398822784424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,balanced,0.7732053597768148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,balanced,0.0568800022204717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,16,power_law_1.2,0.3051071882247925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,balanced,0.807370662689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,balanced,0.07146666447321574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,16,power_law_1.2,0.33448960781097414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,balanced,0.10492266217867534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,balanced,0.8400426705678304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,balanced,0.1634773313999176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,16,power_law_1.2,0.34186880588531493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,balanced,0.8644266923268636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,balanced,0.27702399094899494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,16,power_law_1.2,0.36942079067230227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,balanced,0.39217066764831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,16,power_law_1.2,0.3987519979476929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,balanced,0.9171679814656576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,balanced,0.39447466532389325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,16,power_law_1.2,0.4300864219665527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,balanced,0.39552001158396405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,16,power_law_1.2,0.44048638343811036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,balanced,0.9895733197530111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,balanced,0.3983786503473918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,16,power_law_1.2,0.5605311870574952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,balanced,0.3996479908625285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,balanced,0.40164800484975177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,balanced,1.1021333535512288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,balanced,0.4055253267288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.2,0.5609920024871826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,balanced,0.41065601507822674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,balanced,0.42209064960479736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,balanced,0.42626134554545086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.2,0.5863872051239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,balanced,1.2551360130310059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,balanced,0.43378134568532306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.2,0.6903295993804932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,balanced,0.45501331488291424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.2,0.9388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,balanced,0.47040001551310223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.2,1.079315185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,balanced,0.5076853434244791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,balanced,1.4843573570251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.2,1.493894386291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,balanced,0.5421653191248575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.2,1.9406335830688477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.2,2.626905632019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,balanced,0.6161439816157023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.2,3.713356781005859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,16,power_law_1.2,4.519622421264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,balanced,0.6914560000101725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.01,0.17467520236968995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,balanced,1.9068320592244465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,balanced,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,16,power_law_1.2,7.848384094238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.01,0.26625919342041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,balanced,0.06285333136717479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.01,0.48988800048828124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,balanced,0.8264586925506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,balanced,0.07428800066312154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.01,0.16164480447769164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,balanced,0.11558933059374492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,16,power_law_1.2,14.9510009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,balanced,0.18357867002487183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.01,0.266048002243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,balanced,0.2752373417218526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,balanced,0.387231985727946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.01,0.3484287977218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,balanced,0.389141321182251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,balanced,0.9906666278839111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.01,0.43657598495483396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,balanced,0.3914773464202881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.01,0.10933120250701904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,balanced,0.3922400077184041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.01,0.49904642105102537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,balanced,0.3952639897664388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,balanced,2.4255146980285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.01,0.15541759729385377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.01,0.5454912185668945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,balanced,0.3991573254267375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.01,0.2702080011367798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,balanced,0.40325868129730225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.01,0.5550464153289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,balanced,0.4087253411610921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.01,0.10378880500793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.01,0.5636159896850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,balanced,0.4209973414738973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,balanced,1.265168031056722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.01,0.14919040203094483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,balanced,0.42508800824483234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.01,0.5915008068084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,balanced,0.43881599108378094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.01,0.20146560668945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.01,0.5811520099639893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,balanced,0.4635946750640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.01,0.2272576093673706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.01,0.6202239990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.01,0.27127680778503416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.01,0.2830847978591919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.01,0.6324672222137451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.01,0.30046720504760743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.01,0.6542784214019776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,balanced,0.4859413305918376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.01,0.3132672071456909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.01,0.6761663913726806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,balanced,1.6609172821044922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.01,0.31722240447998046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.01,0.7067967891693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.01,0.31831679344177244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.01,0.7794943809509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,balanced,3.4947945276896157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.01,0.35495040416717527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.01,0.8544704437255859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.01,0.3731264114379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.01,0.9570431709289551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.01,1.186899185180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.01,0.38421120643615725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.01,0.3873408079147339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,balanced,0.5477279822031657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.01,1.0809087753295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.01,0.41902718544006345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.01,1.3229248046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,balanced,0.6073973178863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,balanced,2.0701173146565757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,8,power_law_1.2,0.17519999742507936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.01,0.4386879920959473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.01,1.6582847595214845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.01,0.5348415851593018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,8,power_law_1.2,0.266374397277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,balanced,0.7049012978871664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.01,2.1167743682861326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,8,power_law_1.2,0.24581120014190674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.01,0.5660607814788818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,power_law_1.01,0.11422079801559448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,8,power_law_1.2,0.15086719989776612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.01,0.6898176193237304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.01,2.775596809387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,balanced,0.8238773345947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,power_law_1.01,0.17293440103530883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,8,power_law_1.2,0.21894400119781493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.01,0.7595392227172851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.01,3.361337661743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,8,power_law_1.2,0.3247423887252808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,power_law_1.01,0.2817023992538452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.01,0.9673983573913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,balanced,1.0216426849365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.01,4.637760162353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,8,power_law_1.2,0.36865279674530027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,power_law_1.01,0.11167999505996704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.01,1.1911871910095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,8,power_law_1.2,0.5064127922058106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,power_law_1.01,0.16428799629211427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.01,1.6297536849975587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.01,9.54567642211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,8,power_law_1.2,0.5030335903167724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,power_law_1.01,0.21353600025177003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.01,2.0534912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,8,power_law_1.2,0.543455982208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,balanced,1.3831146558125813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,power_law_1.01,0.22079360485076904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.01,2.4859392166137697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,8,power_law_1.2,0.5627327919006347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,power_law_1.01,0.30002560615539553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,8,power_law_1.2,0.6035007953643798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,balanced,3.039226531982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.01,3.7089153289794923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,power_law_1.01,0.2977344036102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,8,power_law_1.2,0.5817855834960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,power_law_1.01,0.3156735897064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.01,7.619161224365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,8,power_law_1.2,0.6284607887268067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,balanced,1.7923253377278645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,power_law_1.01,0.3131200075149536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,8,power_law_1.2,0.6286464214324952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,power_law_1.01,0.3251136064529419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,balanced,6.81379763285319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,8,power_law_1.2,0.658784008026123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,power_law_1.01,0.35542399883270265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,8,power_law_1.2,0.6800576210021972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,power_law_1.01,0.36027519702911376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,8,power_law_1.2,0.6972032070159913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,power_law_1.01,0.4156032085418701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,8,power_law_1.2,0.7843520164489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,balanced,2.4251999855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,power_law_1.01,0.4175424098968506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,8,power_law_1.2,0.9631360054016114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,power_law_1.01,0.43100800514221194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,8,power_law_1.2,1.02291841506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,power_law_1.01,0.5065919876098632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,8,power_law_1.2,1.2072704315185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,8,power_law_1.2,1.2089983940124511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,8,power_law_1.2,1.4828415870666505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,power_law_1.01,0.5534783840179444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,8,power_law_1.2,1.7716287612915038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,balanced,3.0581385294596353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,power_law_1.01,0.5832511901855468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,8,power_law_1.2,2.33121280670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,power_law_1.01,0.7160064220428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,8,power_law_1.2,2.9195199966430665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,power_law_1.01,0.8582847595214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,8,power_law_1.2,4.284966278076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,power_law_1.01,1.0028608322143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,power_law_1.01,1.333670425415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,8,power_law_1.2,4.9744384765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,power_law_1.01,1.7840639114379884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,balanced,5.848154703776042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,8,power_law_1.2,10.849958038330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,power_law_1.01,2.5568832397460937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,power_law_1.01,3.357260894775391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,power_law_1.01,4.573612976074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,balanced,4.786442756652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,power_law_1.01,6.6637825012207035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,power_law_1.01,13.191392517089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,8,power_law_1.2,0.10888960361480712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,8,power_law_1.2,0.1548416018486023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,8,power_law_1.2,0.16781439781188964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,8,power_law_1.2,0.09630720019340515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,8,power_law_1.2,0.15047039985656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,8,power_law_1.2,0.17536640167236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,8,power_law_1.2,0.20115840435028076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,8,power_law_1.2,0.26305279731750486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,8,power_law_1.2,0.2908992052078247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,8,power_law_1.2,0.2822655916213989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,8,power_law_1.2,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,8,power_law_1.2,0.3133631944656372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,8,power_law_1.2,0.3204927921295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,8,power_law_1.2,0.3639679908752441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,8,power_law_1.2,0.372761607170105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,8,power_law_1.2,0.36329600811004636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,8,power_law_1.2,0.38928000926971434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,balanced,9.324890772501627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,8,power_law_1.2,0.43582720756530763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,8,power_law_1.2,0.4638656139373779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,8,power_law_1.2,0.593459177017212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,8,power_law_1.2,0.6047743797302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,8,power_law_1.2,0.7800704002380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,8,power_law_1.2,0.8175552368164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,8,power_law_1.2,1.1160703659057618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,8,power_law_1.2,1.3141440391540526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,8,power_law_1.2,1.7755775451660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,8,power_law_1.2,2.3223808288574217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,8,power_law_1.2,0.12081279754638671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,8,power_law_1.2,2.6229312896728514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,8,power_law_1.2,0.16901760101318358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,8,power_law_1.2,4.316582489013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,8,power_law_1.2,0.1415488004684448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,8,power_law_1.2,0.10968320369720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,8,power_law_1.2,9.298982238769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,8,power_law_1.2,0.14840320348739625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,balanced,0.06410666803518932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,balanced,0.051274667183558144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,8,power_law_1.2,0.19717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,balanced,0.05791999896367391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,balanced,0.09921600421269734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,8,power_law_1.2,0.22193920612335205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,balanced,0.07298133273919423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,balanced,0.16062933206558228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,8,power_law_1.2,0.2806528091430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,balanced,0.10638933380444844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,balanced,0.2703733245531718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,8,power_law_1.2,0.2795711994171143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,balanced,0.1660106678803762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,balanced,0.50545601050059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,balanced,0.2821386655171712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,8,power_law_1.2,0.2927488088607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,balanced,0.7328480084737142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,balanced,0.39846400419871014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,8,power_law_1.2,0.30554239749908446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,balanced,0.7321440378824869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,balanced,0.4012053410212199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,8,power_law_1.2,0.34140160083770754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,balanced,0.7383573055267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,balanced,0.40343467394510907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,8,power_law_1.2,0.34126720428466795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,balanced,0.738864024480184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,balanced,0.40269867579142254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,balanced,0.40513598918914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,balanced,0.7320640087127686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,8,power_law_1.2,0.36867198944091795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,balanced,0.4123573303222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,balanced,0.7369813124338785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,8,power_law_1.2,0.3854016065597534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,balanced,0.41625599066416424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,balanced,0.738970677057902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,8,power_law_1.2,0.41098880767822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,balanced,0.4177279869715373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,balanced,0.7500426769256592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,balanced,0.43200000127156574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,8,power_law_1.2,0.4525887966156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,balanced,0.7608319918314616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,balanced,0.43692266941070557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,8,power_law_1.2,0.5341824054718017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,balanced,0.7648746967315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,balanced,0.44766398270924884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,balanced,0.773535966873169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,balanced,0.4716106653213501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,8,power_law_1.2,0.5623487949371337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,balanced,0.7948266665140787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,balanced,0.4961920181910197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,balanced,0.8299360275268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,balanced,0.5426826477050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,8,power_law_1.2,0.6360832214355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,balanced,0.8704480330149332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,8,power_law_1.2,0.727839994430542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,balanced,0.5996426741282145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,balanced,0.9237706661224365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,8,power_law_1.2,0.9782912254333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,balanced,0.6914079984029134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,8,power_law_1.2,1.159443187713623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,balanced,1.0168320337931316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,8,power_law_1.2,1.4365247726440429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.01,0.10954240560531617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,balanced,0.7942933241526285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,8,power_law_1.2,1.911942481994629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,balanced,1.1173493067423503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.01,0.15401599407196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,8,power_law_1.2,2.8375295639038085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.01,0.26733438968658446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,8,power_law_1.2,3.5625728607177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,balanced,0.9932640393575033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.01,0.13343360424041747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,balanced,1.2965226968129475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,8,power_law_1.2,4.745126342773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.01,0.2371903896331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.01,0.07626879811286927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,balanced,0.06805333495140076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.01,0.3139136075973511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.01,0.1018496036529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,8,power_law_1.2,7.8401023864746096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,balanced,0.07724266747633617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,balanced,1.2182186444600422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.01,0.3935103893280029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.01,0.16047999858856202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,balanced,0.09099200367927551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,balanced,1.4994559288024902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.01,0.5209663867950439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.01,0.09543039798736572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,balanced,0.12463466326395671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,8,power_law_1.2,16.168333435058592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.01,0.5274240016937256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,balanced,0.19290665785471597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.01,0.14249600172042848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.01,0.5194367885589599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,balanced,0.29234133164087933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.01,0.201363205909729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,balanced,0.40692798296610516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.01,0.5654079914093018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,balanced,0.4098506768544515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.01,0.22558081150054932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,balanced,1.6234666506449382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.01,0.6018303871154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,balanced,0.4118080139160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.01,0.28475520610809324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,balanced,1.8497014045715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,balanced,0.4155999819437663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.01,0.6020351886749268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.01,0.2871232032775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,balanced,0.41915734608968097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.01,0.6230271816253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,balanced,0.42617066701253253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.01,0.3058687925338745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,balanced,0.43051199118296307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.01,0.6476672172546387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.01,0.31715199947357176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,balanced,0.4395893414815267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.01,0.6527679920196533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.01,0.3398591995239258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,balanced,0.45449066162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.01,0.3290623903274536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.01,0.6785215854644775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,balanced,2.065290609995524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,balanced,0.46163733800252277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.01,0.35262720584869384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.01,0.73023362159729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,balanced,2.3184372584025064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,balanced,0.478928009668986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.01,0.3625216007232666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.01,0.7777279853820801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.01,0.3905087947845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,balanced,0.5199040174484253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.01,0.8832703590393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.01,0.40316162109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.01,0.9320192337036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.01,0.4371776103973389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.01,0.4839168071746826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.01,1.1092032432556151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.01,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.01,1.1378111839294434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,balanced,0.5727413495381674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.01,0.6233471870422364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.01,1.3755264282226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.01,0.7713280200958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,balanced,2.587242603302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.01,1.7936063766479493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.01,0.8955072402954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,balanced,2.9862133661905923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.01,2.301888084411621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.01,1.1719552040100099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,power_law_1.01,0.09699199795722961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.01,1.3500160217285155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.01,2.9568832397460936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,power_law_1.01,0.12287360429763794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.01,1.8205696105957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.01,3.487615966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,power_law_1.01,0.18186880350112916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,balanced,0.6790133317311605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.01,2.2969600677490236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,power_law_1.01,0.10317440032958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.01,4.979840087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.01,2.8401792526245115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,balanced,0.7667360305786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,power_law_1.01,0.1538815975189209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,power_law_1.01,0.19792640209197998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.01,4.371980667114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,power_law_1.01,0.24094719886779786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.01,10.373875427246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,balanced,0.9285120169321696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,power_law_1.01,0.2907776117324829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.01,8.754969787597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,power_law_1.01,0.30323200225830077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,balanced,1.1201972961425781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,power_law_1.01,0.3163520097732544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,4,power_law_1.2,0.09938560128211975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,power_law_1.01,0.33263359069824217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,balanced,3.9667094548543296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,power_law_1.01,0.339897608757019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,balanced,4.304741223653157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,4,power_law_1.2,0.15401599407196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,balanced,1.4455572764078777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,power_law_1.01,0.3670527935028076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,4,power_law_1.2,0.14650239944458007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,power_law_1.01,0.3774336099624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,4,power_law_1.2,0.12563199996948243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,power_law_1.01,0.40677762031555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,4,power_law_1.2,0.2288127899169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,balanced,1.9533920288085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,power_law_1.01,0.42624640464782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,4,power_law_1.2,0.3122688055038452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,power_law_1.01,0.4716928005218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,4,power_law_1.2,0.34974079132080077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,power_law_1.01,0.5601024150848388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,4,power_law_1.2,0.4517695903778076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,4,power_law_1.2,0.47324161529541015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,4,power_law_1.2,0.517580795288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,balanced,2.609562714894613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,4,power_law_1.2,0.550822401046753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,power_law_1.01,0.6131264209747315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,4,power_law_1.2,0.5604864120483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,4,power_law_1.2,0.5998847961425782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,4,power_law_1.2,0.5991615772247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,power_law_1.01,0.7000895977020264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,4,power_law_1.2,0.6303872108459473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,power_law_1.01,0.8375231742858886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,4,power_law_1.2,0.6598400115966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,power_law_1.01,1.0789119720458984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,4,power_law_1.2,0.6874815940856933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,balanced,3.5449546178181968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,power_law_1.01,1.2481023788452148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,4,power_law_1.2,0.7397183895111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,4,power_law_1.2,0.8096192359924317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,power_law_1.01,1.7497343063354491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,4,power_law_1.2,0.8982527732849122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,power_law_1.01,2.3022335052490233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,4,power_law_1.2,1.0017727851867675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,power_law_1.01,3.095795249938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,4,power_law_1.2,1.1838015556335448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,balanced,7.615621566772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,4,power_law_1.2,1.2271488189697266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,power_law_1.01,3.97325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,balanced,8.141263961791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,balanced,4.432741483052571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,4,power_law_1.2,1.497216033935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,power_law_1.01,5.473471832275391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,4,power_law_1.2,1.8142784118652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,power_law_1.01,7.850847625732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,4,power_law_1.2,2.4789312362670897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,4,power_law_1.2,3.1798847198486326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,power_law_1.01,16.084934997558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,4,power_law_1.2,4.1480766296386715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,4,power_law_1.2,5.506886291503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,4,power_law_1.2,12.442527770996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,balanced,6.940842946370442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,4,power_law_1.2,0.07637119889259339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,4,power_law_1.2,0.10063999891281128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,4,power_law_1.2,0.1009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,4,power_law_1.2,0.09296000003814697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,4,power_law_1.2,0.13267199993133544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,4,power_law_1.2,0.18238719701766967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,4,power_law_1.2,0.2021183967590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,4,power_law_1.2,0.27986559867858884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,4,power_law_1.2,0.28752639293670657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,4,power_law_1.2,0.2733567953109741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,4,power_law_1.2,0.312006402015686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,4,power_law_1.2,0.33397760391235354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,4,power_law_1.2,0.3311487913131714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,4,power_law_1.2,0.35100159645080564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,4,power_law_1.2,0.3594304084777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,4,power_law_1.2,0.373088002204895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,4,power_law_1.2,0.4013823986053467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,4,power_law_1.2,0.44888958930969236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,4,power_law_1.2,0.49376640319824217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,4,power_law_1.2,0.5874559879302979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,4,power_law_1.2,0.660038423538208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,4,power_law_1.2,0.79268479347229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,4,power_law_1.2,0.9428544044494629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,4,power_law_1.2,1.1611007690429687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,4,power_law_1.2,1.4212736129760741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,balanced,13.750965118408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,4,power_law_1.2,1.9442047119140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,4,power_law_1.2,2.5798912048339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,4,power_law_1.2,3.197100830078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,4,power_law_1.2,4.770924758911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,balanced,0.06513600051403046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,balanced,0.073253333568573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,4,power_law_1.2,9.098124694824218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,balanced,0.10262399911880493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,balanced,0.16014400124549866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,balanced,0.2868480086326599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,4,power_law_1.2,0.0985535979270935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,balanced,0.527514656384786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,4,power_law_1.2,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,balanced,0.7754186789194742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,4,power_law_1.2,0.11157759428024291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,balanced,0.7786133289337158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,4,power_law_1.2,0.11382399797439575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,balanced,0.7751733462015787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,4,power_law_1.2,0.15044480562210083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,balanced,0.7776640256245931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,4,power_law_1.2,0.17751679420471192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,balanced,0.7612213293711344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,4,power_law_1.2,0.2109760046005249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,4,power_law_1.2,0.27786879539489745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,balanced,0.7701546351114908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,4,power_law_1.2,0.2897279977798462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,balanced,0.7717013359069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,4,power_law_1.2,0.2955647945404053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,balanced,0.7775039672851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,4,power_law_1.2,0.3174207925796509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,balanced,0.7922613620758057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,4,power_law_1.2,0.3440576076507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,balanced,0.793386697769165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,4,power_law_1.2,0.3493567943572998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,balanced,0.8018240133921305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,4,power_law_1.2,0.37909760475158694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,balanced,0.8381706873575846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,4,power_law_1.2,0.4034751892089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,balanced,0.8838559786478678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,4,power_law_1.2,0.436627197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,4,power_law_1.2,0.47603840827941896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,balanced,0.9575733343760172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,4,power_law_1.2,0.6143936157226563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,balanced,1.0629493395487468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,balanced,1.2201653321584065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,4,power_law_1.2,0.6336639881134033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,balanced,1.3680052757263184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,4,power_law_1.2,0.759500789642334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,4,power_law_1.2,0.8738880157470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,balanced,0.0539626677831014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,4,power_law_1.2,1.1942079544067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,balanced,1.6667946179707844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,balanced,0.060218666990598045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,4,power_law_1.2,1.3770496368408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,balanced,0.07718933125336964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,balanced,0.11002666751543681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,4,power_law_1.2,1.8647743225097657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,balanced,0.17250667015711466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,4,power_law_1.2,2.488211250305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,balanced,2.0251466433207193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,balanced,0.29585067431132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,4,power_law_1.2,3.270060729980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,balanced,0.4139839808146159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.01,0.07580159902572632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,balanced,0.41927464803059894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,balanced,0.09897599617640178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,4,power_law_1.2,4.681465530395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,balanced,0.42476268609364826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.01,0.10202879905700683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,balanced,0.10664533575375874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,balanced,0.4270826578140259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,4,power_law_1.2,5.626233673095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.01,0.15627520084381102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,balanced,0.11870933572451274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,balanced,2.7705440521240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,balanced,0.43729599316914874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,balanced,0.1527253290017446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.01,0.12235519886016846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,balanced,0.4448639949162801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,4,power_law_1.2,8.89837417602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,balanced,0.22380266586939493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.01,0.2166719913482666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,balanced,0.45158934593200684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,balanced,0.33181333541870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.01,0.31585919857025146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,balanced,0.4627466599146525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.01,0.0608959972858429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,balanced,0.4594666560490926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,balanced,0.46811731656392414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,4,power_law_1.2,19.611366271972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.01,0.3768320083618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,balanced,0.48044268290201825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,balanced,0.470853328704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.01,0.07488639950752259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,balanced,0.4912853240966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.01,0.47031679153442385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,balanced,0.4738453229268392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,balanced,0.5134826501210531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,balanced,3.4281012217203775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.01,0.10301439762115479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.01,0.512172794342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,balanced,0.48231999079386395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.01,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,balanced,0.5464320182800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.01,0.5209856033325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,balanced,0.4927146832148234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.01,0.1501312017440796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,balanced,0.5732053518295288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,balanced,0.5017173290252686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.01,0.5663040161132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.01,0.1954751968383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,balanced,0.5133119821548462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.01,0.6017024040222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.01,0.21765758991241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,balanced,0.6487893263498942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,balanced,0.5354400078455607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.01,0.2844736099243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.01,0.6211711883544921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.01,0.30222721099853517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,balanced,0.7228586673736572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,balanced,0.5480586687723795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.01,0.6361087799072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.01,0.3079040050506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,balanced,0.5944639841715494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.01,0.6610623836517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.01,0.32641921043395994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,balanced,0.8448639710744222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,balanced,0.6784799893697103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,balanced,4.119039853413899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.01,0.33486080169677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.01,0.6979455947875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.01,0.36360960006713866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.01,0.6910016059875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,balanced,1.0155839920043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.01,0.38248960971832274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.01,0.7457727909088134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.01,0.4158592224121094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.01,0.803872013092041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,balanced,0.7602079709370931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.01,0.4338111877441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.01,0.948089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.01,0.4448383808135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,balanced,1.3395039240519206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.01,1.0241215705871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.01,0.49880318641662597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.01,1.2623744010925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.01,0.5610047817230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.01,1.410912036895752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.01,0.6609792232513427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,balanced,1.6719679832458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.01,1.7151424407958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,balanced,0.9775253136952718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.01,0.7161087989807129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.01,2.284646415710449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.01,0.8836864471435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,balanced,1.1434986591339111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.01,3.1617279052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.01,1.0356800079345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,balanced,6.3649546305338545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.01,3.5331390380859373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,balanced,1.3797653516133626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.01,1.3376255989074708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.01,4.133881759643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.01,1.7955072402954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,balanced,2.3733439445495605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,balanced,1.7821760177612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.01,2.5723007202148436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.01,6.531654357910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.01,2.944576072692871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.01,13.314002990722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.01,3.635539245605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,balanced,2.3054986000061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,power_law_1.01,0.10438400506973267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.01,5.729663848876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,power_law_1.01,0.11724159717559815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,balanced,2.8104321161905923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,power_law_1.01,0.1532096028327942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.01,11.680185699462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,balanced,3.296112060546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,power_law_1.01,0.13292800188064574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,2,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,power_law_1.01,0.1869503974914551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,2,power_law_1.2,0.10188800096511841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,power_law_1.01,0.23180799484252929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,2,power_law_1.2,0.11548800468444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,power_law_1.01,0.2607295989990234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,2,power_law_1.2,0.1315775990486145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,power_law_1.01,0.3222527980804443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,2,power_law_1.2,0.19553279876708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,balanced,4.458698590596517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,power_law_1.01,0.34984960556030276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,2,power_law_1.2,0.2807039976119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,balanced,3.4823732376098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,power_law_1.01,0.364518404006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,2,power_law_1.2,0.33147521018981935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,power_law_1.01,0.3662336111068726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,2,power_law_1.2,0.4698431968688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,power_law_1.01,0.40247039794921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,2,power_law_1.2,0.4996607780456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,power_law_1.01,0.4187327861785889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,2,power_law_1.2,0.500819206237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,2,power_law_1.2,0.5075776100158691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,power_law_1.01,0.45493760108947756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,2,power_law_1.2,0.5623167991638184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,balanced,6.041573206583659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,power_law_1.01,0.47817602157592776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,2,power_law_1.2,0.5664959907531738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,balanced,12.140939076741537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,power_law_1.01,0.5180992126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,2,power_law_1.2,0.6386559963226318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,power_law_1.01,0.5939519882202149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,2,power_law_1.2,0.6784575939178467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,power_law_1.01,0.7394432067871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,2,power_law_1.2,0.6927103996276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,2,power_law_1.2,0.7083136081695557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,2,power_law_1.2,0.7665088176727295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,2,power_law_1.2,0.8637248039245605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,power_law_1.01,0.8091839790344239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,balanced,5.505354563395183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,2,power_law_1.2,0.977177619934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,balanced,7.578512191772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,2,power_law_1.2,1.0926143646240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,power_law_1.01,0.9688511848449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,2,power_law_1.2,1.2806591987609863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,2,power_law_1.2,1.454150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,power_law_1.01,1.1691967964172363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,2,power_law_1.2,1.8050559997558593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,power_law_1.01,1.534553623199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,2,power_law_1.2,2.4886655807495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,power_law_1.01,1.8738943099975587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,2,power_law_1.2,3.4309310913085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,power_law_1.01,2.5610559463500975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,2,power_law_1.2,3.648672103881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,power_law_1.01,3.286105728149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,2,power_law_1.2,4.50964469909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,power_law_1.01,4.998374557495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,2,power_law_1.2,6.843539428710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,power_law_1.01,6.205267333984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,power_law_1.01,7.502758026123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,2,power_law_1.2,13.499827575683593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,balanced,11.834730784098307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,2,power_law_1.2,0.06049280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,power_law_1.01,11.847270202636718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,2,power_law_1.2,0.0743552029132843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,2,power_law_1.2,0.0794368028640747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,2,power_law_1.2,0.09008640050888062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,power_law_1.01,23.984115600585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,2,power_law_1.2,0.12833280563354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,2,power_law_1.2,0.16922880411148072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,2,power_law_1.2,0.20365440845489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,2,power_law_1.2,0.2608191967010498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,2,power_law_1.2,0.28771200180053713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,balanced,11.092491149902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,2,power_law_1.2,0.30227839946746826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,2,power_law_1.2,0.3154239892959595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,2,power_law_1.2,0.33739519119262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,2,power_law_1.2,0.3451839923858643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,2,power_law_1.2,0.3805567979812622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,2,power_law_1.2,0.41632637977600095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,2,power_law_1.2,0.4316351890563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,2,power_law_1.2,0.4554624080657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,2,power_law_1.2,0.5108416080474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,2,power_law_1.2,0.5693952083587647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,2,power_law_1.2,0.6843200206756592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,2,power_law_1.2,0.7468287944793701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,2,power_law_1.2,0.9444031715393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,balanced,23.099385579427082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,2,power_law_1.2,1.0591551780700683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,2,power_law_1.2,1.4242688179016114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,2,power_law_1.2,1.9477760314941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,2,power_law_1.2,0.10421119928359986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,2,power_law_1.2,2.7471168518066404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,2,power_law_1.2,0.11701760292053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,2,power_law_1.2,3.2055233001708983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,2,power_law_1.2,0.12341760396957398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,2,power_law_1.2,0.12669440507888793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,2,power_law_1.2,3.7887168884277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,balanced,0.06968000034491222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,2,power_law_1.2,0.17256959676742553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,balanced,0.08024533092975616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,2,power_law_1.2,0.2165760040283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,2,power_law_1.2,6.461395263671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,balanced,0.1095199982325236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,2,power_law_1.2,0.25460479259490965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,balanced,0.17026132345199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,2,power_law_1.2,0.30901761054992677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,2,power_law_1.2,12.505158233642579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,balanced,0.29427733023961383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,2,power_law_1.2,0.32644479274749755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,balanced,0.5382773478825887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,2,power_law_1.2,0.3405951976776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,balanced,0.7716426849365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,2,power_law_1.2,0.36424961090087893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,balanced,0.7772106329600016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,balanced,0.7814666430155436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,2,power_law_1.2,0.397708797454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,balanced,0.7846826712290446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,2,power_law_1.2,0.41728639602661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,balanced,0.775871992111206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,2,power_law_1.2,0.4532224178314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,balanced,0.06312533219655354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,balanced,0.7875200112660726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,2,power_law_1.2,0.4799232006072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,balanced,0.06770133475462596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,balanced,0.7936320304870605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,2,power_law_1.2,0.5258495807647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,balanced,0.08674133817354839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,balanced,0.13110400239626566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,balanced,0.8017066319783529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,2,power_law_1.2,0.5931583881378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,balanced,0.21183466911315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,balanced,0.3677813212076823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,balanced,0.8150506814320883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,2,power_law_1.2,0.7557568073272705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,balanced,0.5212800105412801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,balanced,0.8235039710998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,balanced,0.5244266589482626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,balanced,0.5341600179672241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,balanced,0.84552534421285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,balanced,0.534608006477356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,2,power_law_1.2,0.8401920318603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,balanced,0.5415573517481486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,balanced,0.9095946947733561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,balanced,0.5509066581726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,balanced,0.9729706446329752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,balanced,0.5648053487141927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,balanced,0.5832800070444742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,2,power_law_1.2,0.9954431533813477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,balanced,1.0944426854451497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,balanced,0.5983146826426188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,2,power_law_1.2,1.1867967605590821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,balanced,0.6166026592254639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,balanced,1.2572800318400066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,2,power_law_1.2,1.660268783569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,balanced,0.6526293357213339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,balanced,0.7033812999725342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,2,power_law_1.2,1.9977855682373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,balanced,1.4940746625264485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,balanced,0.7540373007456461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,2,power_law_1.2,2.695897674560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,balanced,0.8764533201853434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,2,power_law_1.2,3.6104896545410154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,balanced,1.8149174054463704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,balanced,0.9869546890258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,2,power_law_1.2,4.901657485961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,2,power_law_1.2,6.63056640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,balanced,1.1932960351308186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,balanced,2.4384533564249673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,2,power_law_1.2,8.346713256835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,balanced,1.5038293202718098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,2,power_law_1.2,12.138009643554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,balanced,3.075167973836263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,balanced,2.0708373387654624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,2,power_law_1.2,25.2029052734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,balanced,0.1586186687151591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,balanced,2.6556320190429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,balanced,4.401551882425944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,balanced,0.17014400164286295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,balanced,0.1848586599032084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,balanced,0.21619733174641928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.01,0.06258559823036194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,balanced,0.29578665892283124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.06499199867248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.01,0.06314240097999572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,balanced,0.43809600671132404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,balanced,3.8639198939005532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,balanced,0.5923519929250082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.01,0.08354560136795045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.07525119781494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,balanced,0.6035146713256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.01,0.10350079536437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.10537600517272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,balanced,0.6145653327306112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,balanced,5.275349299112956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.01,0.16300159692764282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,balanced,0.623520016670227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.1348031997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.01,0.22580480575561523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,balanced,0.637498656908671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.21825919151306153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.01,0.2622463941574097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,balanced,0.6504693428675333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.01,0.337990403175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.3361471891403198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,balanced,0.669701337814331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,balanced,4.51580270131429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.01,0.3510656118392944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.38188159465789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,balanced,0.708079973856608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.01,0.36459519863128664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.5101183891296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,balanced,0.749130646387736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.01,0.4006080150604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.5329919815063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,balanced,0.7813493410746256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.01,0.41672320365905763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,balanced,6.215391794840495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.5508927822113037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,balanced,0.8528532981872559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.01,0.4342144012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.5841728210449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,balanced,0.9764106273651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.01,0.4741568088531494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.6288896083831788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.01,0.5054656028747558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.6336192131042481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.01,0.526700782775879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,balanced,5.597322463989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.6533760070800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.01,0.5517759799957276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,balanced,1.1536426544189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.01,0.6422272205352784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.6792064189910889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.01,0.7121024131774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.7009791851043701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,power_law_1.01,0.1382591962814331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.01,0.8780096054077149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.7454592227935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,power_law_1.01,0.1490496039390564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.01,0.9750656127929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.8490816116333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,power_law_1.01,0.16848000288009643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.9208895683288574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.01,1.1983296394348144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,power_law_1.01,0.19523199796676635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,balanced,1.5404267311096191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,power_law_1.01,0.24972798824310302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.01,1.1494400024414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.01,1.4461248397827149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,balanced,9.428037643432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,power_law_1.01,0.30499839782714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,balanced,1.8467893600463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.01,1.2771136283874511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.01,1.9859968185424806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,power_law_1.01,0.3480063915252686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,power_law_1.01,0.4342912197113037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.01,1.6129791259765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.01,2.5110015869140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,balanced,2.2881867090861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,power_law_1.01,0.4566527843475342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.8769983291625976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.01,3.5973377227783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,power_law_1.01,0.47628159523010255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,balanced,8.53766949971517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,power_law_1.01,0.4968832015991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.01,2.518387222290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.01,4.4403839111328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,balanced,3.05894406636556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,power_law_1.01,0.5287295818328858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.01,3.1460287094116213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.01,5.425043106079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,power_law_1.01,0.5571904182434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.06531199812889099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,power_law_1.01,0.620198392868042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.01,4.4429374694824215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.0754751980304718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,balanced,4.0449174245198565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.01,8.401132965087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,power_law_1.01,0.6815743923187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.09099519848823548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.01,5.150713729858398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,power_law_1.01,0.732096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.13108479976654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,power_law_1.01,0.8331263542175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.01,6.202131271362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.01,18.65608367919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.19563519954681396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,power_law_1.01,1.0664128303527831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.29796481132507324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,balanced,5.766757329305013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.01,9.46517105102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.3527359962463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.01,1.2023615837097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.4762752056121826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.01,20.56243896484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.5153279781341553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.01,1.490988826751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.5272511959075927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.01,1.8194623947143556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,balanced,7.845312118530273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.5630911827087403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.01,2.4740543365478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.01,3.101260757446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.5800704002380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.01,4.350137710571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.6347968101501464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.01,5.600006484985352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.6487679958343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.6793727874755859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.01,8.100672149658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,balanced,20.24945576985677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.6902207851409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.01,10.567654418945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,balanced,10.712346394856771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.7602943897247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.880281639099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.01,13.093785095214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.9722944259643554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,balanced,18.114805857340496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,1,power_law_1.2,1.1585280418395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,power_law_1.01,20.51292724609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,1,power_law_1.2,1.3292223930358886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,1,power_law_1.2,1.648249626159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.9497152328491212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,power_law_1.01,40.492288208007814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,balanced,13.4344482421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,1,power_law_1.2,2.563257598876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,1,power_law_1.2,3.286054229736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,1,power_law_1.2,4.533158493041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,1,power_law_1.2,5.179110336303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,1,power_law_1.2,6.227078247070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.055776000022888184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,1,power_law_1.2,9.552108764648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.06339840292930603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.07452160120010376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.10114560127258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,1,power_law_1.2,20.618719482421874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.15032960176467897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.19916160106658937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,balanced,20.953226725260418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.2413248062133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,1,power_law_1.2,0.32215681076049807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,1,power_law_1.2,0.33422079086303713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,1,power_law_1.2,0.3562175989151001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,1,power_law_1.2,0.3943104028701782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,1,power_law_1.2,0.4200575828552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,1,power_law_1.2,0.43450241088867186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,1,power_law_1.2,0.47192959785461425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,1,power_law_1.2,0.4988224029541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,1,power_law_1.2,0.5384511947631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,1,power_law_1.2,0.5563007831573487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,1,power_law_1.2,0.6529600143432617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,0.7279232025146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,0.9042048454284668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,1.0057408332824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,1.2560832023620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,1.5161791801452638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,2.055891227722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,2.591155242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,3.694144058227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,4.473113632202148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,1,power_law_1.2,5.469535827636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,1,power_law_1.2,8.426163482666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,balanced,41.087076822916664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,1,power_law_1.2,18.486431884765626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,balanced,0.06223999957243601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,balanced,0.06311999758084615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,balanced,0.06404266754786174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,balanced,0.05569600065549215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,balanced,0.06165866553783417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,balanced,0.0844533344109853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,balanced,0.08771733442942302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,balanced,0.08822400371233623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,balanced,0.11414399743080139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,balanced,0.11446932951609294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,balanced,0.11318399508794148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,balanced,0.1919893423716227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,1,power_law_1.2,0.137990403175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,balanced,0.1895786722501119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,balanced,0.19012266397476196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,1,power_law_1.2,0.1485759973526001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,power_law_1.01,0.10391680002212525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,balanced,0.1883359948794047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,16,power_law_1.2,0.10590720176696777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,1,power_law_1.2,0.17424639463424682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,balanced,0.1876586675643921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,power_law_1.01,0.13458559513092042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,16,power_law_1.2,0.1119488000869751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,1,power_law_1.2,0.19316480159759522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,balanced,0.18735466400782266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,power_law_1.2,0.07731199860572815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,16,power_law_1.01,0.0843775987625122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,1,power_law_1.2,0.23374719619750978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,power_law_1.2,0.06951680183410644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,balanced,0.18800532817840576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,16,power_law_1.01,0.06476160287857055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,1,power_law_1.2,0.29100799560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,power_law_1.2,0.059910398721694944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,balanced,0.19062934319178262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,16,power_law_1.01,0.06407039761543273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,power_law_1.2,0.07461760044097901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,1,power_law_1.2,0.32760961055755616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,power_law_1.2,0.08464639782905578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,balanced,0.1967466672261556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,balanced,0.04829333225886027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,16,power_law_1.01,0.07762560248374939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,power_law_1.2,0.08315520286560059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,1,power_law_1.2,0.4208576202392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,power_law_1.2,0.10758399963378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,balanced,0.20690133174260458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,balanced,0.04896533489227295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,16,power_law_1.01,0.08229759931564332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,1,power_law_1.2,0.4492159843444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,power_law_1.2,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,balanced,0.05390933156013489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,16,power_law_1.01,0.08442879915237426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,power_law_1.2,0.1191167950630188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,balanced,0.22747733195622763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,1,power_law_1.2,0.4624512195587158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,power_law_1.2,0.19638400077819823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,balanced,0.0658186674118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,16,power_law_1.01,0.11390719413757325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,power_law_1.2,0.17984000444412232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,1,power_law_1.2,0.4867839813232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,balanced,0.07134399811426799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,balanced,0.24820266167322794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,16,power_law_1.01,0.11050239801406861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,power_law_1.2,0.1921023964881897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,1,power_law_1.2,0.5240511894226074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,power_law_1.2,0.18807679414749146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,balanced,0.08468266328175862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,16,power_law_1.01,0.11777280569076538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,power_law_1.2,0.19650559425354003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,1,power_law_1.2,0.5447167873382568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,balanced,0.08589866757392883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,balanced,0.4015359878540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,16,power_law_1.01,0.18835840225219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,power_law_1.2,0.20193920135498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,balanced,0.08637332916259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,1,power_law_1.2,0.6197760105133057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,power_law_1.2,0.2316864013671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,16,power_law_1.01,0.19100799560546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,balanced,0.0811413327852885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,power_law_1.2,0.2366719961166382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,1,power_law_1.2,0.6840191841125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,16,power_law_1.01,0.19225599765777587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,balanced,0.44526398181915283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,balanced,0.08190399905045827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,power_law_1.2,0.2929728031158447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,1,power_law_1.2,0.7274303913116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,16,power_law_1.01,0.18010879755020143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,balanced,0.08180266618728638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,power_law_1.2,0.3245503902435303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,balanced,0.11461333433787028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,power_law_1.2,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,16,power_law_1.01,0.19487359523773193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,1,power_law_1.2,0.8328127861022949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,power_law_1.2,0.6157375812530518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,balanced,0.11317333579063416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,balanced,0.6528693437576294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,16,power_law_1.01,0.19287680387496947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,1,power_law_1.2,1.0633791923522948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,power_law_1.2,0.7741184234619141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,balanced,0.11332266529401143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,power_law_1.2,1.0080063819885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,16,power_law_1.01,0.2049855947494507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,power_law_1.01,0.07204480171203613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,power_law_1.2,1.48657283782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,balanced,0.17665600776672363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,16,power_law_1.01,0.20982398986816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,power_law_1.01,0.09189119935035706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,power_law_1.2,2.3981056213378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.2,1.2125056266784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,balanced,0.17528533935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,16,power_law_1.01,0.2466304063796997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,balanced,0.8569119771321615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,power_law_1.01,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,power_law_1.2,2.7396991729736326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,balanced,0.17643199364344278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,16,power_law_1.01,0.32264320850372313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,power_law_1.01,0.07097600102424621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,power_law_1.2,4.778265762329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,balanced,0.17676266034444174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,16,power_law_1.01,0.4061888217926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,power_law_1.01,0.06955519914627076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.2,1.499897575378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,balanced,0.18041066328684488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,16,power_law_1.01,0.5169600009918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,power_law_1.2,11.984063720703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,power_law_1.01,0.07909119725227357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.2,1.8369407653808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,balanced,0.1875306765238444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,power_law_1.01,0.08318079710006714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,16,power_law_1.01,0.6335552215576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,balanced,1.0640479723612468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,power_law_1.01,0.08362240195274354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.2,2.5054527282714845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,16,power_law_1.01,0.8755071640014649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,balanced,0.19781333208084106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,power_law_1.01,0.07832319736480713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,16,power_law_1.01,1.1633407592773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.2,3.138431930541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,balanced,0.21838400761286417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,power_law_1.01,0.07921919822692872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,16,power_law_1.01,1.5699584007263183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,power_law_1.01,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.2,4.37017593383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,balanced,0.2408906618754069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,16,power_law_1.01,2.2434175491333006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,power_law_1.01,0.10355839729309083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.2,5.616128158569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,power_law_1.01,3.339168167114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,16,balanced,1.6701919237772624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,balanced,0.40651198228200275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,power_law_1.01,0.11385600566864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.2,8.106208038330077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,power_law_1.01,6.718450927734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,power_law_1.01,0.18837759494781495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,power_law_1.01,0.18197120428085328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,balanced,0.447215994199117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.2,10.505478668212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,power_law_1.01,0.18108160495758058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,power_law_1.01,0.20750079154968262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.2,12.995660400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,power_law_1.01,0.21893761157989503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,balanced,0.6540746688842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,power_law_1.01,0.24683520793914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,1,power_law_1.2,20.40312957763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,power_law_1.01,0.27486720085144045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,power_law_1.01,0.35501439571380616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,power_law_1.01,0.3953536033630371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,balanced,0.8572586377461752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,power_law_1.01,0.5451456069946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,1,power_law_1.2,40.18089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,16,balanced,3.304021199544271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,power_law_1.01,0.7149119853973389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,8,power_law_1.2,0.07159039974212647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,balanced,0.03435199956099192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,power_law_1.01,1.003718376159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,8,power_law_1.2,0.08652160167694092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,balanced,1.0655466715494792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,balanced,0.038746667404969536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,8,power_law_1.2,0.06234880089759827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,power_law_1.01,1.4272255897521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,balanced,0.039306665460268654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,8,power_law_1.2,0.07050880193710327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,power_law_1.01,1.6271232604980468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,8,power_law_1.2,0.06861439943313599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,balanced,0.06612800061702728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,8,power_law_1.2,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,power_law_1.01,2.5830720901489257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,balanced,0.07819733520348866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,8,power_law_1.2,0.08314239978790283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,balanced,0.0788320004940033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,power_law_1.01,5.631935882568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,balanced,1.6787947018941243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,8,power_law_1.2,0.08278399705886841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,balanced,0.08561600248018901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,8,power_law_1.2,0.07895039916038513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,balanced,0.08560533324877422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,8,power_law_1.2,0.08074880242347718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,balanced,0.08620267113049825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,8,power_law_1.2,0.07976959943771363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,balanced,0.08621866504351298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,balanced,0.08417066931724548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,8,power_law_1.2,0.10970239639282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,balanced,0.08432533343633015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,8,power_law_1.2,0.11421439647674561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,balanced,0.08487466971079509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,balanced,0.1113973359266917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,8,power_law_1.2,0.10926079750061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,balanced,0.10931199789047241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,8,power_law_1.2,0.18586879968643188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,balanced,0.11260799566904704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,8,power_law_1.2,0.18392319679260255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,balanced,0.1874613364537557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,8,power_law_1.2,0.18711040019989014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,balanced,0.19033600886662802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,8,power_law_1.2,0.2093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,balanced,0.19742933909098306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,8,power_law_1.2,0.23235840797424318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,balanced,3.317994753519694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,balanced,0.20677866538365683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,8,power_law_1.2,0.2665600061416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,8,power_law_1.2,0.32436480522155764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,balanced,0.2265440026919047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,8,power_law_1.2,0.39271039962768556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,balanced,0.24953599770863852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,8,power_law_1.2,0.509772777557373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,balanced,0.42163201173146564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,8,power_law_1.2,0.6076543807983399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,8,power_law_1.2,0.8621888160705566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,balanced,0.4668480157852173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,8,power_law_1.2,1.2311296463012695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,8,power_law_1.2,1.6232255935668944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,8,power_law_1.2,2.031276893615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,balanced,0.6791466871897379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,8,power_law_1.2,3.636147308349609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,8,power_law_1.2,7.063123321533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,balanced,0.8941919803619385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,power_law_1.01,0.03600000143051148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,balanced,1.1081279913584392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,power_law_1.01,0.04390400052070618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,power_law_1.01,0.04392960071563721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,power_law_1.01,0.05334399938583374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,power_law_1.01,0.06381440162658691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,power_law_1.01,0.06727039813995361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,power_law_1.01,0.07216640114784241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,power_law_1.01,0.07230719923973083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,4,power_law_1.2,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,balanced,1.7383519808451335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,4,power_law_1.2,0.04247680008411407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,power_law_1.01,0.08012160062789916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,4,power_law_1.2,0.03924480080604553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,power_law_1.01,0.0828544020652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,power_law_1.01,0.08254079818725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,4,power_law_1.2,0.05416319966316223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,power_law_1.01,0.08182399868965148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,4,power_law_1.2,0.05906559824943543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,power_law_1.01,0.08305280208587647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,4,power_law_1.2,0.06511359810829162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,power_law_1.01,0.11241600513458253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,4,power_law_1.2,0.071424001455307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,power_law_1.01,0.11651840209960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,4,power_law_1.2,0.07917439937591553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,power_law_1.01,0.11862399578094482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,4,power_law_1.2,0.0738752007484436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,power_law_1.01,0.20687360763549806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,4,power_law_1.2,0.07994880080223084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,power_law_1.01,0.22612481117248534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,4,power_law_1.2,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,4,power_law_1.2,0.0812991976737976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,power_law_1.01,0.23948800563812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,4,power_law_1.2,0.08362240195274354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,power_law_1.01,0.2649856090545654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,balanced,0.030533333619435627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,balanced,3.4344800313313804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,4,power_law_1.2,0.08300799727439881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,power_law_1.01,0.33987839221954347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,4,power_law_1.2,0.11596159934997559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,power_law_1.01,0.4298111915588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,power_law_1.01,0.030822399258613586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,balanced,0.03676266719897588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,balanced,0.04562133550643921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,power_law_1.01,0.5087999820709228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,4,power_law_1.2,0.11567360162734985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,power_law_1.01,0.0355648010969162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,power_law_1.01,0.667142391204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,4,power_law_1.2,0.12558720111846924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,power_law_1.01,0.03578239977359772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,balanced,0.06754666566848755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,power_law_1.01,0.04679040014743805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,4,power_law_1.2,0.20531840324401857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,power_law_1.01,0.9612159729003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,power_law_1.01,0.0568448007106781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,power_law_1.01,1.1786432266235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,4,power_law_1.2,0.23315839767456054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,balanced,0.08755200107892354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,power_law_1.01,0.06529279947280883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,4,power_law_1.2,0.256710410118103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,power_law_1.01,1.4446271896362304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,balanced,0.08020799855391185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,power_law_1.01,0.07141119837760926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,4,power_law_1.2,0.28897919654846194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,power_law_1.01,2.155462455749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,balanced,0.08049599826335907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,power_law_1.01,0.07265920042991639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,4,power_law_1.2,0.3646656036376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,balanced,0.0805920014778773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,power_law_1.01,4.699270248413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,power_law_1.01,0.07400959730148315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,balanced,0.08107199768225352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,4,power_law_1.2,0.4349823951721191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,power_law_1.01,0.07462400197982788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,balanced,0.08728532989819844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,4,power_law_1.2,0.6152575969696045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,power_law_1.01,0.08104959726333619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,balanced,0.08756800492604573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,2,power_law_1.2,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,balanced,0.08789333701133728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,4,power_law_1.2,0.6669439792633056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,power_law_1.01,0.08475520014762879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,balanced,0.08834667007128398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,2,power_law_1.2,0.0359360009431839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,power_law_1.01,0.08465279936790467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,4,power_law_1.2,1.114412784576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,balanced,0.08947199583053589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,2,power_law_1.2,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,4,power_law_1.2,1.325279998779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,power_law_1.01,0.08750079870223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,balanced,0.09185066819190979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,4,power_law_1.2,1.4542271614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,2,power_law_1.2,0.0474368005990982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,power_law_1.01,0.08751999735832214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,balanced,0.09328533212343852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,2,power_law_1.2,0.05514879822731018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,power_law_1.01,0.09900799989700318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,4,power_law_1.2,2.6448192596435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,2,power_law_1.2,0.0593280017375946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,balanced,0.12628799676895142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,power_law_1.01,0.10413440465927123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,balanced,0.02608533451954524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,4,power_law_1.2,5.417529678344726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,2,power_law_1.2,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,balanced,0.13149866461753845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,power_law_1.01,0.13282560110092162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,balanced,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,2,power_law_1.2,0.0742464005947113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,balanced,0.03364799916744232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,power_law_1.01,0.14150400161743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,balanced,0.2162933349609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,balanced,0.04667733112970988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,2,power_law_1.2,0.07420799732208253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,power_law_1.01,0.2553600072860718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,balanced,0.22747200727462769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,2,power_law_1.2,0.07524480223655701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,power_law_1.01,0.2762752056121826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,2,power_law_1.2,0.08262400031089782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,balanced,0.25098133087158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,power_law_1.01,0.347763204574585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,balanced,0.10104533036549886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,2,power_law_1.2,0.08450559973716736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,power_law_1.01,0.4107391834259033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,balanced,0.2775146762530009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,2,power_law_1.2,0.08599039912223816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,balanced,0.09923199812571208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,power_law_1.01,0.532908821105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,2,power_law_1.2,0.08752639889717102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,balanced,0.10046399633089702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,power_law_1.01,0.6686528205871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,balanced,0.4694133202234904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,2,power_law_1.2,0.0950655996799469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,balanced,0.09727999567985535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,power_law_1.01,0.9339967727661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,2,power_law_1.2,0.10025600194931031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,balanced,0.0963200032711029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,2,power_law_1.2,0.10581120252609252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,power_law_1.01,1.1569727897644042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,balanced,0.5177599986394247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,balanced,0.09754133224487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,2,power_law_1.2,0.13576960563659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,balanced,0.09795199831326802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,power_law_1.01,1.4071871757507324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,balanced,0.09773332873980205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,power_law_1.01,0.025459200143814087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,2,power_law_1.2,0.15500160455703735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,power_law_1.01,2.2138368606567385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,balanced,0.7532853285471598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,balanced,0.0995360016822815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,2,power_law_1.2,0.26356480121612547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,power_law_1.01,0.029798400402069092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,power_law_1.01,3.993862533569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,balanced,0.10046933094660442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,power_law_1.01,0.032569599151611325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,2,power_law_1.2,0.3062592029571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,power_law_1.01,0.04172160029411316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,2,power_law_1.2,0.36229119300842283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,balanced,0.1037546694278717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,power_law_1.01,0.05440639853477478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,2,power_law_1.2,0.43442559242248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,balanced,0.9876266320546468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,balanced,0.10814932982126872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,power_law_1.01,0.06450560092926025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,2,power_law_1.2,0.5778751850128174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,balanced,0.1283253331979116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,power_law_1.01,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,2,power_law_1.2,0.7516096115112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,power_law_1.01,0.08041599988937378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,balanced,0.13741333285967508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,2,power_law_1.2,0.9517312049865723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,power_law_1.01,0.08332160115242004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,balanced,1.2143200238545735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,power_law_1.01,0.08494719862937927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,balanced,0.1695893406867981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,2,power_law_1.2,1.2276032447814942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,2,power_law_1.2,1.456275177001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,power_law_1.01,0.08711040019989014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,balanced,0.18421866496404013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,power_law_1.01,0.08839679956436157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,power_law_1.2,2.4693695068359376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,power_law_1.01,0.09192320108413696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,balanced,0.33788267771402997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,power_law_1.2,4.330912017822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,power_law_1.01,0.10365439653396606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,balanced,0.3686613241831462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,2,balanced,1.9157333374023438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,power_law_1.01,0.11507840156555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,power_law_1.01,0.13066879510879517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,balanced,0.632207989692688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,power_law_1.01,0.14387199878692628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,power_law_1.01,0.1670464038848877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,balanced,0.6899147033691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,power_law_1.01,0.20880000591278075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,power_law_1.01,0.25063040256500246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,power_law_1.01,0.4338687896728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,balanced,1.0065546830495198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,power_law_1.01,0.516486406326294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,power_law_1.01,0.6734272003173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,power_law_1.01,0.8258048057556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,1,power_law_1.2,0.025356799364089966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,power_law_1.01,1.142585563659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,balanced,1.3147839705149333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,1,power_law_1.2,0.0296640008687973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,2,balanced,3.769909222920736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,power_law_1.01,1.451052761077881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,1,power_law_1.2,0.031711998581886294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,1,power_law_1.2,0.04207360148429871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,power_law_1.01,1.7712448120117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,1,power_law_1.2,0.05118079781532288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,power_law_1.01,2.6979583740234374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,1,power_law_1.2,0.06079999804496765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,1,power_law_1.2,0.07822080254554749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,balanced,1.6250826517740886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,power_law_1.01,5.167206573486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,1,power_law_1.2,0.08309760093688964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,1,power_law_1.2,0.08334720134735107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,1,power_law_1.2,0.08429440259933471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,1,power_law_1.2,0.08731520175933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,1,power_law_1.2,0.08840960264205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,1,power_law_1.2,0.09316480159759521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,1,power_law_1.2,0.09970560073852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,1,power_law_1.2,0.10926079750061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,balanced,2.559157371520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,1,power_law_1.2,0.11806080341339112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,1,power_law_1.2,0.13333760499954223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,1,power_law_1.2,0.147980797290802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,1,power_law_1.2,0.1706496000289917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,1,power_law_1.2,0.2174015998840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,1,power_law_1.2,0.2596479892730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,1,power_law_1.2,0.4639552116394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,1,power_law_1.2,0.5412352085113525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,1,power_law_1.2,0.6949632167816162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,1,power_law_1.2,0.852780818939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,1,power_law_1.2,1.163980770111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,1,power_law_1.2,1.4784768104553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,1,power_law_1.2,1.7901824951171874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,balanced,0.056890666484832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,power_law_1.01,0.06721919775009155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,1,power_law_1.2,2.7197376251220704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,balanced,5.050698598225911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,1,power_law_1.2,5.243289566040039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,balanced,0.057818666100502014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,power_law_1.01,0.056377601623535153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,power_law_1.01,0.058924800157546996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,balanced,0.058101331194241844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,16,power_law_1.2,0.06735360026359558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,power_law_1.01,0.05472000241279602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,balanced,0.05514133473237356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,16,power_law_1.2,0.06146559715270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,16,power_law_1.2,0.06272640228271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,16,power_law_1.2,0.05548160076141358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,power_law_1.01,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,power_law_1.2,0.0592960000038147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,16,balanced,0.05991999804973602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,power_law_1.01,0.06924800276756286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,power_law_1.2,0.0690559983253479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,16,balanced,0.0678719977537791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,power_law_1.01,0.07663999795913697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,power_law_1.2,0.07933440208435058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,16,balanced,0.07649066547552745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,power_law_1.01,0.07497599720954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,balanced,0.04674133161703745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,power_law_1.2,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,power_law_1.01,0.08783360123634339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,16,balanced,0.0741066684325536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,power_law_1.01,0.0904640018939972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,power_law_1.2,0.09013760089874268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,16,balanced,0.08713600039482117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,power_law_1.01,0.09139840006828308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,balanced,0.048010667165120445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,balanced,0.08881066242853801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,16,power_law_1.2,0.08764799833297729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,power_law_1.01,0.0917631983757019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,balanced,0.0876586635907491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,16,power_law_1.2,0.09054719805717468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,power_law_1.01,0.09348480105400085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,balanced,0.08654933174451192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,balanced,0.051301335295041404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,16,power_law_1.2,0.0927295982837677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,power_law_1.01,0.09840000271797181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,balanced,0.08762133121490479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,balanced,0.04965866605440775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,power_law_1.01,0.11543680429458618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,16,power_law_1.2,0.10213760137557984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,balanced,0.0881706674893697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,power_law_1.01,0.11293439865112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,balanced,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,balanced,0.08815466364224751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,16,power_law_1.2,0.11196160316467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,power_law_1.01,0.11809920072555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,balanced,0.05504000186920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,balanced,0.08921066919962566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,16,power_law_1.2,0.11123199462890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,power_law_1.01,0.16762239933013917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,balanced,0.06275199850400288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,power_law_1.01,0.18405760526657106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,16,power_law_1.2,0.11365760564804077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,balanced,0.09135466814041138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,balanced,0.06354666749636333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,power_law_1.01,0.2590656042098999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,16,power_law_1.2,0.14151040315628052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,balanced,0.09642133116722107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,power_law_1.01,0.3224064111709595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,16,power_law_1.2,0.19196159839630128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,power_law_1.01,0.5206719875335694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,balanced,0.10002133250236511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,balanced,0.07018666466077168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,power_law_1.01,0.06332160234451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,16,power_law_1.2,0.19718400239944459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,power_law_1.01,0.6807104110717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,balanced,0.07096533477306366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,balanced,0.12875733772913614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,power_law_1.01,0.9555199623107911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,16,power_law_1.2,0.3325952053070068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,power_law_1.01,0.04989440143108368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,balanced,0.07026666899522145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,power_law_1.01,1.1469440460205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,balanced,0.13700266679128012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,16,power_law_1.2,0.4151872158050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,power_law_1.01,0.05554559826850891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,balanced,0.07097066442171733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,power_law_1.01,1.794233512878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,power_law_1.2,0.5643072128295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,power_law_1.01,0.05159040093421936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,balanced,0.0719946672519048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,16,balanced,0.2114773392677307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,power_law_1.01,2.4905216217041017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,power_law_1.01,0.05048959851264954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,power_law_1.2,0.7100800037384033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,balanced,0.07215466598669688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,power_law_1.01,3.89251823425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,power_law_1.01,0.05493119955062866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,balanced,0.07342400153477986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,power_law_1.2,1.2410304069519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,16,balanced,0.2423200011253357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,power_law_1.01,5.746195220947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,power_law_1.01,0.06405119895935059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,balanced,0.07663999994595845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,power_law_1.2,1.7227903366088868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,8,power_law_1.2,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,power_law_1.01,0.06408960223197938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,balanced,0.07959466675917308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,16,balanced,0.35152534643809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,power_law_1.01,10.340691375732423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,power_law_1.2,2.9162111282348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,8,power_law_1.2,0.05790719985961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,power_law_1.01,0.07605760097503662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,balanced,0.08284799754619598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,power_law_1.2,3.5545406341552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,8,power_law_1.2,0.05923200249671936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,power_law_1.01,0.0738048017024994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,power_law_1.01,0.08067839741706848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,balanced,0.1327946682771047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,8,power_law_1.2,0.05101439952850342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,16,balanced,0.436901330947876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,power_law_1.2,4.044300842285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,power_law_1.01,0.07466880083084107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,8,power_law_1.2,0.050195199251174924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,balanced,0.14099199573198953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,power_law_1.01,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,power_law_1.2,7.697113800048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,8,power_law_1.2,0.05494400262832642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,power_law_1.01,0.08136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,balanced,0.19992534319559732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,16,balanced,0.6420799891153971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,8,power_law_1.2,0.06366080045700073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,power_law_1.01,0.08777599930763244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,power_law_1.2,15.180160522460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,8,power_law_1.2,0.06291840076446534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,balanced,0.23267199595769247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,power_law_1.01,0.1023743987083435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,8,power_law_1.2,0.07453439831733703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,power_law_1.01,0.1200063943862915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,8,power_law_1.2,0.08334720134735107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,balanced,0.33842666943868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,power_law_1.01,0.1372607946395874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,16,balanced,0.8433279991149902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,8,power_law_1.2,0.0827455997467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,power_law_1.01,0.15821440219879152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,8,power_law_1.2,0.08206080198287964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,power_law_1.01,0.21458559036254882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,balanced,0.4397653341293335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,8,power_law_1.2,0.08595839738845826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,power_law_1.01,0.2226560115814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,8,power_law_1.2,0.10439679622650147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,power_law_1.01,0.37154560089111327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,16,balanced,1.0496959686279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,8,power_law_1.2,0.10861439704895019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,balanced,0.6448266506195068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,power_law_1.01,0.5252287864685059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,8,power_law_1.2,0.11237119436264038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,power_law_1.01,0.6807487964630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,8,power_law_1.2,0.1206015944480896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,8,power_law_1.2,0.14453760385513306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,power_law_1.01,0.7923391819000244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,8,power_law_1.2,0.17473920583724975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,power_law_1.01,1.427660846710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,balanced,0.848095973332723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,8,power_law_1.2,0.23571839332580566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,power_law_1.01,1.5881279945373534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,8,power_law_1.2,0.31356799602508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,16,balanced,1.6559146245320637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,balanced,0.03332266708215078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,power_law_1.01,0.034329599142074584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,power_law_1.01,2.253228759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,8,power_law_1.2,0.4147327899932861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,balanced,0.03660800059636434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,power_law_1.01,0.03776000142097473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,8,power_law_1.2,0.5272064208984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,power_law_1.01,2.9845888137817385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,balanced,0.03896533449490865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,power_law_1.01,0.03866240084171295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,8,power_law_1.2,1.010655975341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,balanced,1.0535306930541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,power_law_1.01,0.04411520063877106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,power_law_1.01,8.352934265136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,8,power_law_1.2,1.2204352378845216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,8,power_law_1.2,1.692108726501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,balanced,0.04437866806983948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,power_law_1.01,0.04418559968471527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,balanced,0.042378668983777366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,8,power_law_1.2,2.493337631225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,power_law_1.01,0.043968001008033754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,balanced,0.04514666895071665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,8,power_law_1.2,2.5023359298706054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,balanced,0.04673066735267639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,power_law_1.01,0.04733439981937408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,power_law_1.01,0.049465599656105044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,power_law_1.2,4.690784072875976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,8,balanced,1.6670667330423992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,balanced,0.05565333366394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,power_law_1.2,10.345503997802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,power_law_1.01,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,balanced,0.05064000189304352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,balanced,0.051818668842315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,power_law_1.01,0.053350400924682614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,16,balanced,3.285877227783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,power_law_1.01,0.059564799070358276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,balanced,0.08217066526412964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,balanced,0.0732586681842804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,power_law_1.01,0.08739200234413147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,balanced,0.07379733522733052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,power_law_1.01,0.08426240086555481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,balanced,0.0741066684325536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,power_law_1.01,0.07928320169448852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,balanced,0.07805866499741872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,power_law_1.01,0.08111360073089599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,power_law_1.01,0.0913919985294342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,balanced,0.07910933097203572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,power_law_1.01,0.1000704050064087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,8,balanced,3.298997243245443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,balanced,0.08346133430798848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,power_law_1.01,0.12483199834823608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,balanced,0.08654399712880452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,power_law_1.01,0.1316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,balanced,0.12986133495966592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,power_law_1.01,0.17789440155029296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,balanced,0.1394719978173574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,power_law_1.01,0.1989824056625366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,power_law_1.01,0.2781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,balanced,0.19716266791025797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,power_law_1.01,0.40480642318725585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,power_law_1.01,0.5250751972198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,balanced,0.23860265811284384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,power_law_1.01,0.6928768157958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,power_law_1.01,0.9955904006958007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,balanced,0.3535039822260539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,power_law_1.01,1.3440320014953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,power_law_1.01,1.6744895935058595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,balanced,0.4534720182418823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,power_law_1.01,2.498860740661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,power_law_1.01,4.704774475097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,balanced,0.66539200146993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,4,power_law_1.2,0.03456639945507049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,4,power_law_1.2,0.03857280015945434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,4,power_law_1.2,0.038540801405906676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,balanced,0.874122699101766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,4,power_law_1.2,0.04385280013084412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,4,power_law_1.2,0.043680000305175784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,4,power_law_1.2,0.04229759871959686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,balanced,0.029493334392706554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,4,power_law_1.2,0.0466048002243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,balanced,1.0873226324717205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,balanced,0.033610666791598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,4,power_law_1.2,0.051500797271728516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,4,power_law_1.2,0.058873599767684935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,4,power_law_1.2,0.057785600423812866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,4,power_law_1.2,0.060678398609161376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,balanced,0.04342400034268697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,4,power_law_1.2,0.08863360285758973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,4,power_law_1.2,0.08558719754219055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,balanced,0.04341333111127218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,4,power_law_1.2,0.08370559811592101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,balanced,1.7203680674235027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,4,power_law_1.2,0.08328959941864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,balanced,0.04379733403523763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,4,power_law_1.2,0.09400320053100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,4,power_law_1.2,0.11084799766540528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,balanced,0.04795200129350027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,4,power_law_1.2,0.1339967966079712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,balanced,0.04478399952252706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,4,power_law_1.2,0.13400319814682007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,balanced,0.04552533229192098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,4,power_law_1.2,0.17431679964065552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,4,power_law_1.2,0.23809280395507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,balanced,0.05696000158786774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,4,power_law_1.2,0.3326656103134155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,balanced,0.05471999943256378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,4,power_law_1.2,0.4033023834228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,balanced,0.055455997586250305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,4,power_law_1.2,0.6458111763000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,4,power_law_1.2,0.8205056190490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,4,power_law_1.2,1.084652805328369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,4,power_law_1.2,1.512070369720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,power_law_1.01,0.030374398827552794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,balanced,3.3902292251586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,balanced,0.0836906631787618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,4,power_law_1.2,2.0800960540771483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,power_law_1.01,0.03359360098838806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,balanced,0.07810133198897044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,power_law_1.01,0.0333759993314743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,4,power_law_1.2,3.532089614868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,balanced,0.07966400186220805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,power_law_1.01,0.039001598954200745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,power_law_1.01,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,balanced,0.08452799916267395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,4,power_law_1.2,6.4735870361328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,power_law_1.01,0.04497919976711273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,balanced,0.08878399928410848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,power_law_1.01,0.04963839948177338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,power_law_1.01,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,balanced,0.13969066739082336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,2,power_law_1.2,0.030118399858474733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,balanced,0.025562666356563568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,power_law_1.01,0.05479679703712463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,balanced,0.1508693297704061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,balanced,0.029994666576385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,2,power_law_1.2,0.03296639919281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,power_law_1.01,0.055731201171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,balanced,0.03233599911133448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,2,power_law_1.2,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,balanced,0.21669334173202515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,power_law_1.01,0.057222402095794676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,balanced,0.046613335609436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,2,power_law_1.2,0.03784320056438446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,power_law_1.01,0.05924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,balanced,0.2649386723836263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,balanced,0.04604266583919525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,power_law_1.01,0.0641215980052948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,2,power_law_1.2,0.046265599131584165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,2,power_law_1.2,0.04474239945411682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,power_law_1.01,0.06725760102272034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,balanced,0.3933813174565633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,balanced,0.04613866905371348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,power_law_1.01,0.09196159839630128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,2,power_law_1.2,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,power_law_1.01,0.025791999697685242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,power_law_1.01,0.08885759711265565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,balanced,0.0448586642742157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,2,power_law_1.2,0.05095040202140808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,power_law_1.01,0.02800000011920929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,balanced,0.5044639905293783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,balanced,0.044490665197372437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,power_law_1.01,0.08991360068321227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,2,power_law_1.2,0.05594239830970764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,balanced,0.04537599782148997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,power_law_1.01,0.1223680019378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,power_law_1.01,0.030393600463867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,2,power_law_1.2,0.05586559772491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,balanced,0.045082668463389076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,power_law_1.01,0.03617280125617981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,2,power_law_1.2,0.05736320018768311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,power_law_1.01,0.13100160360336305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,balanced,0.7354559898376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,balanced,0.04543466866016388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,power_law_1.01,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,2,power_law_1.2,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,power_law_1.01,0.1671872019767761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,2,power_law_1.2,0.0661184012889862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,balanced,0.04882133503754934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,power_law_1.01,0.1892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,power_law_1.01,0.0444927990436554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,2,power_law_1.2,0.06743680238723755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,balanced,0.04877866804599762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,power_law_1.01,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,power_law_1.01,0.25936639308929443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,balanced,0.9655840396881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,2,power_law_1.2,0.0942463994026184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,balanced,0.05106666684150696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,power_law_1.01,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,power_law_1.01,0.3661632061004639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,2,power_law_1.2,0.08780800104141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,balanced,0.05774933099746704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,power_law_1.01,0.05082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,power_law_1.01,0.4899007797241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,2,power_law_1.2,0.10265599489212036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,power_law_1.01,0.051974397897720334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,balanced,0.05926933387915293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,power_law_1.01,0.629145622253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,2,power_law_1.2,0.12476160526275634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,power_law_1.01,0.05356159806251526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,balanced,0.06318399806817372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,power_law_1.01,0.9586048126220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,balanced,1.1887626647949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,power_law_1.01,0.05738239884376526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,2,power_law_1.2,0.13210879564285277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,balanced,0.09479999542236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,power_law_1.01,1.1965248107910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,power_law_1.01,0.0584384024143219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,2,power_law_1.2,0.16586240530014038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,balanced,0.10056533416112264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,power_law_1.01,1.4327808380126954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,power_law_1.01,0.061343997716903687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,2,power_law_1.2,0.20639359951019287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,balanced,0.17042134205500284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,power_law_1.01,2.569830322265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,power_law_1.01,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,2,power_law_1.2,0.2981631994247437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,balanced,0.18346667289733887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,power_law_1.01,4.587206268310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,power_law_1.01,0.07406719923019409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,2,power_law_1.2,0.366540789604187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,power_law_1.01,0.07869439721107482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,balanced,0.26791999737421673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,2,power_law_1.2,0.515231990814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,balanced,1.8774293263753254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,power_law_1.01,0.13325439691543578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,2,power_law_1.2,0.6773695945739746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,1,power_law_1.2,0.024742400646209715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,balanced,0.3508053223292033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,power_law_1.01,0.14669439792633057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,2,power_law_1.2,0.9419903755187988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,1,power_law_1.2,0.02773759961128235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,power_law_1.01,0.19794559478759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,2,power_law_1.2,1.3405376434326173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,1,power_law_1.2,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,balanced,0.5136373440424601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,power_law_1.01,0.22780160903930663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,2,power_law_1.2,1.584716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,1,power_law_1.2,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,power_law_1.01,0.3096575975418091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,1,power_law_1.2,0.044710400700569156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,2,power_law_1.2,2.750655937194824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,power_law_1.01,0.39164159297943113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,balanced,0.6702240308125814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,1,power_law_1.2,0.04343680143356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,power_law_1.01,0.5522560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,power_law_1.2,4.979539108276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,1,power_law_1.2,0.04872959852218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,power_law_1.01,0.7101376056671143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,1,power_law_1.2,0.04895359873771667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,balanced,0.9842613538106283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,power_law_1.01,1.020902442932129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,1,power_law_1.2,0.050297600030899045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,power_law_1.01,1.333414363861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,1,power_law_1.2,0.05177599787712097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,2,balanced,3.709013303120931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,1,power_law_1.2,0.05354239940643311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,power_law_1.01,1.6432191848754882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,1,power_law_1.2,0.05737599730491638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,power_law_1.01,2.573676872253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,balanced,1.2949386437733967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,1,power_law_1.2,0.05803520083427429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,power_law_1.01,5.043679809570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,1,power_law_1.2,0.060627198219299315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,1,power_law_1.2,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,1,power_law_1.2,0.07415040135383606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,1,power_law_1.2,0.07901440262794494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,balanced,1.6053172747294109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,1,power_law_1.2,0.13441920280456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,1,power_law_1.2,0.1473855972290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,1,power_law_1.2,0.1961856007575989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,balanced,0.05736533304055532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,balanced,0.04624533156553904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,1,power_law_1.2,0.22700159549713134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,balanced,0.05881600081920624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,balanced,0.04612799982229868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,1,power_law_1.2,0.31040000915527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,balanced,0.05781333148479462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,balanced,0.04610133171081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,1,power_law_1.2,0.39149439334869385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,balanced,0.060090666015942894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,balanced,0.04872000217437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,balanced,0.06018133461475372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,1,power_law_1.2,0.5506368160247803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,balanced,0.060378665725390114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,balanced,2.53767999013265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,balanced,0.04840533435344696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,1,power_law_1.2,0.7063744068145752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,balanced,0.060959999759991966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,balanced,0.048384000857671104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,balanced,0.06412800153096516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,1,power_law_1.2,1.0224639892578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,balanced,0.04950400193532308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,balanced,0.06376533210277557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,1,power_law_1.2,1.325881576538086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,balanced,0.06427200138568878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,balanced,0.04901333153247833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,1,power_law_1.2,1.636627197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,balanced,0.07066133121649425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,balanced,0.050341332952181496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,balanced,0.06322133541107178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,1,power_law_1.2,2.5644607543945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,balanced,0.05039466420809428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,balanced,0.0626986672480901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,balanced,0.05063466727733612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,power_law_1.2,5.033388900756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,balanced,0.06444266438484192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,balanced,0.0499893327554067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,balanced,0.07223999996980031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,balanced,0.051088000337282814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,balanced,0.07227199772993724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,balanced,0.051829333106676735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,balanced,0.058864002426465355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,balanced,0.07167999943097432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,balanced,0.059530665477116905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,balanced,0.08915199836095174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,balanced,0.05975999931494395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,balanced,0.08371733625729878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,balanced,0.07253333429495494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,balanced,0.1144533356030782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,1,balanced,5.023562749226888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,balanced,0.07339733342329662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,balanced,0.11037333806355794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,balanced,0.10321600238482158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,balanced,0.15533333023389181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,balanced,0.10433066884676616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,balanced,0.17715734243392944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,balanced,0.1437493364016215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,balanced,0.2664480010668437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,balanced,0.16113066673278809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,balanced,0.31705600023269653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,balanced,0.2225066622098287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,balanced,0.4645386536916097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,balanced,0.28045332431793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,balanced,0.40556267897288006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,balanced,0.5676213502883911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,balanced,0.5142346620559692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,balanced,0.7091253598531088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,balanced,0.6374133427937826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,balanced,1.0938613414764404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,balanced,0.040133332212766014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,balanced,0.03858133405447006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,balanced,0.9819466272989908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,balanced,0.03842666745185852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,balanced,0.04234666625658671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,balanced,0.04225599765777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,balanced,0.04303466777006785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,balanced,2.1464160283406577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,balanced,0.043653334180514015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.01,0.04412800073623657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.01,0.056985598802566526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,balanced,1.9011573791503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.01,0.056390398740768434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.01,0.04645760059356689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.01,0.0585536003112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,balanced,0.04604266583919525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.01,0.04428159892559051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.01,0.059059202671051025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.01,0.048825600743293764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.01,0.06346880197525025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.01,0.04739840030670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.01,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.01,0.04895359873771667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.01,0.06437119841575623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.01,0.053401601314544675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.01,0.070169597864151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,balanced,0.0452159990866979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.01,0.07037439942359924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.01,0.051641601324081424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,power_law_1.01,0.037625598907470706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.01,0.07101439833641052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.01,0.055430400371551516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,balanced,0.04650133351484934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,power_law_1.01,0.03790720105171204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.01,0.0802623987197876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.01,0.06046079993247986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,balanced,0.04717866579691569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.01,0.08303359746932984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,power_law_1.01,0.03776639997959137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.01,0.05420799851417542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,balanced,0.0467199981212616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.01,0.09268479943275451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,power_law_1.01,0.04103040099143982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,power_law_1.01,0.04168320000171662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.01,0.11153279542922974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.01,0.0650111973285675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,power_law_1.01,0.044531199336051944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.01,0.10792959928512573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.01,0.06607360243797303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,power_law_1.01,0.048511999845504764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.01,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.01,0.08120319843292237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,balanced,0.05426133175690969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.01,0.1828927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,power_law_1.01,0.052095997333526614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.01,0.09107199907302857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,balanced,0.05481599768002828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.01,0.09477120041847228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,power_law_1.01,0.056460797786712646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.01,0.2387712001800537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,balanced,0.05505066613356272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.01,0.12469760179519654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,power_law_1.01,0.06257920265197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.01,0.14302079677581786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.01,0.3594944000244141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,4,8,power_law_1.2,0.056377601623535153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.01,0.178220796585083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.01,0.3130687952041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.01,0.24231040477752686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,power_law_1.01,0.053491199016571046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,4,8,power_law_1.2,0.05719040036201477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.01,0.45401601791381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.01,0.36149120330810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,power_law_1.01,0.0658240020275116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,4,8,power_law_1.2,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.01,0.344870400428772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.01,0.5205183982849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,power_law_1.01,0.06776319742202759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,4,8,power_law_1.2,0.058822399377822875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,balanced,0.06446933249632518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.01,0.5395135879516602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.01,0.791155195236206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,power_law_1.01,0.07756800055503846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,4,8,power_law_1.2,0.05939840078353882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.01,0.7212416172027588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,balanced,0.06737066805362701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.01,0.9820992469787597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.01,1.0966912269592286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,4,8,power_law_1.2,0.06355839967727661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.01,1.4620287895202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.01,1.3368191719055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,4,8,power_law_1.2,0.06838399767875672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,power_law_1.01,0.08333439826965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,4,8,power_law_1.2,0.043289598822593686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.01,1.865247917175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.01,1.8122367858886719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,4,8,power_law_1.2,0.06473600268363952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,power_law_1.01,0.08721920251846313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.01,2.4392255783081054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,4,8,power_law_1.2,0.07825919985771179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,power_law_1.01,0.10021760463714599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.01,2.6011199951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,4,8,power_law_1.2,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.01,3.8974720001220704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,4,8,power_law_1.2,0.07553279995918274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,balanced,0.08566400408744812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.01,4.676774215698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,4,8,power_law_1.2,0.04390400052070618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,4,8,power_law_1.2,0.07271040081977845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.01,7.876499176025391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,4,8,power_law_1.2,0.04645119905471802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,power_law_1.01,0.1271615982055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,4,8,power_law_1.2,0.08486400246620178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,power_law_1.01,0.16090240478515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,4,8,power_law_1.2,0.04653440117835998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,4,8,power_law_1.2,0.09326720237731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,balanced,0.09713600079218547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,4,8,power_law_1.2,0.04867199957370758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,4,8,power_law_1.2,0.09127680063247681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,balanced,0.1350933313369751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,4,8,power_law_1.2,0.054099202156066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,4,8,power_law_1.2,0.11562880277633666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,power_law_1.01,0.2219327926635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,4,8,power_law_1.2,0.1198464035987854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,4,8,power_law_1.2,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,4,8,power_law_1.2,0.13384319543838502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,power_law_1.01,0.2585472106933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,4,8,power_law_1.2,0.06104959845542908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,4,8,power_law_1.2,0.16640640497207643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,power_law_1.01,0.34841599464416506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,balanced,0.16790932416915894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,4,8,power_law_1.2,0.061452800035476686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,4,8,power_law_1.2,0.22862720489501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,4,8,power_law_1.2,0.05479679703712463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,balanced,0.23662932713826498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,4,8,power_law_1.2,0.34780800342559814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,power_law_1.01,0.5481984138488769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,4,8,power_law_1.2,0.06289920210838318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,4,8,power_law_1.2,0.30186240673065184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,power_law_1.01,0.6639359951019287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,balanced,0.3017226656277974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,4,8,power_law_1.2,0.06714239716529846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,4,8,power_law_1.2,0.4482816219329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,power_law_1.01,1.0820735931396483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,4,8,power_law_1.2,0.06391680240631104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,4,8,power_law_1.2,0.49205760955810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,4,8,power_law_1.2,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,4,8,power_law_1.2,0.8072640419006347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,4,8,power_law_1.2,0.0899839997291565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,4,8,power_law_1.2,0.969542407989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,4,8,power_law_1.2,0.09794560074806213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,4,8,power_law_1.2,1.467033576965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,balanced,0.5009599924087524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,power_law_1.01,1.701228713989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,4,8,power_law_1.2,0.12744319438934326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,4,8,power_law_1.2,1.987615966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,power_law_1.01,2.1935680389404295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,4,8,power_law_1.2,0.15322879552841187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,4,8,power_law_1.2,2.449247932434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,4,8,power_law_1.2,0.21000959873199462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,balanced,0.6279946565628052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,power_law_1.01,2.5116031646728514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,4,8,power_law_1.2,3.817087936401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,4,8,power_law_1.2,0.25873279571533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,power_law_1.01,4.079212951660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,4,8,power_law_1.2,0.3831360101699829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,4,8,power_law_1.2,7.255149078369141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,balanced,0.7742453416188558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,4,8,power_law_1.2,0.35267200469970705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,power_law_1.01,8.62402572631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,4,8,power_law_1.2,0.5467199802398681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,balanced,0.05093333125114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,4,8,power_law_1.2,0.7291264057159423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,balanced,0.04753066599369049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,4,8,power_law_1.2,1.0984127998352051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,balanced,1.2140106360117595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,balanced,0.05710400144259135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,4,8,power_law_1.2,1.4183103561401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,balanced,0.0611413319905599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,4,8,power_law_1.2,1.8157567977905273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,balanced,0.06065066655476888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,4,8,power_law_1.2,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,balanced,0.06099733213583628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,4,8,power_law_1.2,2.6578048706054687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,4,8,power_law_1.2,0.03763839900493622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,balanced,0.06164266665776571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,balanced,0.06222933530807495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,4,8,power_law_1.2,0.03743999898433685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,4,8,power_law_1.2,5.064902496337891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,balanced,0.061333333452542625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,4,8,power_law_1.2,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,balanced,0.06137600044409434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,4,8,power_law_1.2,0.041555199027061465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,balanced,0.06253866851329803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,4,8,power_law_1.2,0.0430976003408432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,balanced,2.3871359825134277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,4,8,power_law_1.2,0.04785920083522797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,balanced,0.06319466729958852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,balanced,0.0631573349237442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,4,8,power_law_1.2,0.050860798358917235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,balanced,0.0643093337615331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,4,8,power_law_1.2,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,balanced,0.07234133283297221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,4,8,power_law_1.2,0.061990398168563846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,balanced,0.07348266740640004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,balanced,0.07227733234564464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,balanced,0.08578667044639587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,4,8,power_law_1.2,0.0543936014175415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,balanced,0.09102933605511983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,4,8,power_law_1.2,0.058534401655197146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,balanced,0.11120532949765523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,4,8,power_law_1.2,0.06577280163764954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,balanced,0.11545600493748982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,4,8,power_law_1.2,0.0827072024345398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,balanced,0.17760000626246134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,4,8,power_law_1.2,0.08173440098762512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,balanced,0.1914506753285726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,4,8,power_law_1.2,0.08513919711112976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,balanced,0.26893333594004315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,4,8,power_law_1.2,0.10944639444351197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,balanced,0.34326398372650146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,4,8,power_law_1.2,0.13155839443206788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,balanced,0.49741331736246747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,4,8,power_law_1.2,0.1653887987136841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,balanced,0.6140960057576498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,4,8,power_law_1.2,0.2172800064086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,4,8,power_law_1.2,0.28531200885772706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,4,8,power_law_1.2,0.4733119964599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,balanced,0.7780053615570068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,4,8,power_law_1.2,0.5895103931427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,balanced,0.037733333806196846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,4,8,power_law_1.2,0.8432255744934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,4,8,power_law_1.2,1.1280447959899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,balanced,0.03855466594298681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,balanced,1.2235253651936848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,balanced,0.042821332812309265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,4,8,power_law_1.2,1.8461759567260743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,balanced,0.04612799982229868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,balanced,0.045461331804593406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,4,8,power_law_1.2,2.1992448806762694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,4,8,power_law_1.2,2.633535957336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,balanced,0.04774933556715647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,balanced,0.04859733581542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,4,8,power_law_1.2,4.349555206298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,balanced,0.04890666902065277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,balanced,0.04956266780694326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,4,8,power_law_1.2,8.296403503417968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,balanced,0.02848000079393387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,balanced,2.315274715423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,balanced,0.028346667687098186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,balanced,0.05077333251635233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,balanced,0.035904000202814736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,balanced,0.052789335449536644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,balanced,0.04005866746107737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,balanced,0.053445334235827126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.01,0.051526397466659546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,balanced,0.05993066728115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,balanced,0.04140799989302953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.01,0.05321599841117859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,balanced,0.06035733222961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,balanced,0.04224533339341482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.01,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,balanced,0.041573333243529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.01,0.0610368013381958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,balanced,0.06195733447869619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,balanced,0.04594666759173075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.01,0.059935998916625974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,balanced,0.07297066847483318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,balanced,0.04656533400217692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.01,0.060057598352432254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,balanced,0.07962666451931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.01,0.06260480284690857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.01,0.06548479795455933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,balanced,0.09614400068918864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.01,0.043750399351119997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.01,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.01,0.04314239919185638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,balanced,0.10595200459162395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.01,0.0744704008102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.01,0.039084801077842714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,balanced,0.15107199549674988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.01,0.0447488009929657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,balanced,0.04586133360862732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.01,0.04454399943351746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.01,0.07198079824447631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,balanced,0.1768959959348043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,balanced,0.04610666632652283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.01,0.04762240052223206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.01,0.08363519906997681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,balanced,0.04712533454100291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,balanced,0.24865599473317465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.01,0.08299520015716552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.01,0.04838399887084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,balanced,0.047007997830708824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.01,0.05359359979629517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.01,0.09566079974174499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,balanced,0.32178666194279987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,4,power_law_1.2,0.04805119931697845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.01,0.060787200927734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.01,0.09943040013313294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,4,power_law_1.2,0.052908802032470705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,balanced,0.4730986754099528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,4,power_law_1.2,0.055366402864456175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.01,0.0585536003112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.01,0.103603196144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,power_law_1.01,0.03201279938220978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.01,0.13448959589004517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,4,power_law_1.2,0.059654402732849124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.01,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.01,0.16573439836502074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,4,power_law_1.2,0.06069759726524353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,power_law_1.01,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.01,0.0650111973285675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.01,0.21010560989379884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,balanced,0.5683893362681071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,balanced,0.05474133292833964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,power_law_1.01,0.03115519881248474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,4,power_law_1.2,0.06104320287704468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.01,0.2089792013168335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,balanced,0.055919999877611794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.01,0.28448638916015623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,power_law_1.01,0.038335999846458434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,4,power_law_1.2,0.0623744010925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.01,0.07150080204010009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,balanced,0.057904000083605446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.01,0.3672447919845581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,balanced,0.7097547054290771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,power_law_1.01,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.01,0.07457280158996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,4,power_law_1.2,0.06371200084686279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.01,0.5746560096740723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,power_law_1.01,0.04302079975605011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.01,0.694924783706665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.01,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,4,power_law_1.2,0.06616960167884826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.01,1.2356736183166503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,power_law_1.01,0.04395520091056824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.01,0.10784000158309937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,4,power_law_1.2,0.06855679750442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.01,1.8762880325317384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,balanced,0.06878399848937988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,power_law_1.01,0.047603198885917665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.01,0.12526079416275024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,4,power_law_1.2,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.01,1.788198471069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,power_law_1.01,0.04962559938430786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,balanced,0.07287999987602234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,balanced,1.1261653105417888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.01,0.1716096043586731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,4,power_law_1.2,0.07368320226669312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.01,3.318252944946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,power_law_1.01,0.052716797590255736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.01,0.18806400299072265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,4,power_law_1.2,0.0800383985042572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.01,5.511872100830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.01,0.25167999267578123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,4,power_law_1.2,0.08295680284500122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.01,0.31198079586029054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,4,power_law_1.2,0.09898880124092102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,power_law_1.01,0.052857601642608644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,4,power_law_1.2,0.10483839511871337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.01,0.5228544235229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,power_law_1.01,0.05336959958076477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,4,power_law_1.2,0.10945919752120972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.01,0.5791232109069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,power_law_1.01,0.06037120223045349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,balanced,0.09713066617647807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,4,power_law_1.2,0.1548095941543579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,power_law_1.01,0.0671999990940094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.01,0.8682623863220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,balanced,0.11010133226712544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,4,power_law_1.2,0.19544320106506347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,balanced,2.113349278767904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,4,power_law_1.2,0.23515520095825196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.01,1.1120896339416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,balanced,0.15402666727701822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,4,power_law_1.2,0.25886080265045164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.01,1.3195327758789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,power_law_1.01,0.07273600101470948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,balanced,0.19757866859436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,4,power_law_1.2,0.36267518997192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,power_law_1.01,0.07996799945831298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.01,2.3657663345336912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,4,power_law_1.2,0.5051775932312011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,balanced,0.3005173405011495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,power_law_1.01,0.09075199961662292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,4,power_law_1.2,0.5799359798431396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.01,4.07441291809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,balanced,0.4103519916534424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,4,power_law_1.2,0.8410431861877441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,power_law_1.01,0.09886720180511474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,4,power_law_1.2,0.9640704154968261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,power_law_1.01,0.13029119968414307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,4,power_law_1.2,1.6158655166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,4,power_law_1.2,2.075174331665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,power_law_1.01,0.19942400455474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,balanced,0.6161333322525024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,4,power_law_1.2,3.4736385345458984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,power_law_1.01,0.26743040084838865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,4,power_law_1.2,7.068851470947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,power_law_1.01,0.35445759296417234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,balanced,0.8118186791737875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,power_law_1.01,0.6001023769378662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,power_law_1.01,0.737171220779419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,4,power_law_1.2,0.040031999349594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,balanced,1.0099146366119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,power_law_1.01,0.9216256141662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,4,power_law_1.2,0.03914240002632141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,4,power_law_1.2,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,power_law_1.01,1.7226175308227538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,4,power_law_1.2,0.04335359930992126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,4,power_law_1.2,0.03246079981327057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,4,power_law_1.2,0.04470399916172028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,power_law_1.01,2.151532745361328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,4,power_law_1.2,0.04747520089149475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,balanced,1.592842737833659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,4,power_law_1.2,0.031411200761795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,power_law_1.01,2.466694450378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,4,power_law_1.2,0.049107199907302855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,4,power_law_1.2,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,4,power_law_1.2,0.0336896002292633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,power_law_1.01,4.8892158508300785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,4,power_law_1.2,0.05738880038261414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,4,power_law_1.2,0.03919999897480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,4,power_law_1.2,0.057657599449157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,power_law_1.01,8.082086181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,4,power_law_1.2,0.057120001316070555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,4,power_law_1.2,0.05974400043487549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,4,power_law_1.2,0.040294399857521056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,4,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,4,power_law_1.2,0.04307200014591217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,4,power_law_1.2,0.06291199922561645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,4,power_law_1.2,0.04821760058403015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,4,power_law_1.2,0.0707647979259491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,balanced,3.145109176635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,4,power_law_1.2,0.07882879972457886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,4,power_law_1.2,0.04933759868144989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,4,power_law_1.2,0.08286719918251037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,4,power_law_1.2,0.05010560154914856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,4,power_law_1.2,0.10988160371780395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,4,power_law_1.2,0.058406400680541995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,4,power_law_1.2,0.1356735944747925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,4,power_law_1.2,0.18945280313491822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,4,power_law_1.2,0.1983296036720276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,4,power_law_1.2,0.2800447940826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,4,power_law_1.2,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,4,power_law_1.2,0.35317120552062986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,4,power_law_1.2,0.49759998321533205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,4,power_law_1.2,0.056704002618789676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,4,power_law_1.2,0.6159167766571045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,4,power_law_1.2,0.05551999807357788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,4,power_law_1.2,0.9215488433837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,4,power_law_1.2,1.2748160362243652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,4,power_law_1.2,0.06572800278663635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,4,power_law_1.2,1.6843648910522462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,4,power_law_1.2,2.3409856796264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,4,power_law_1.2,0.07708799839019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,4,power_law_1.2,4.259552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,4,power_law_1.2,0.07173759937286377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,4,power_law_1.2,0.0939136028289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,4,power_law_1.2,0.11601279973983765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,4,power_law_1.2,0.12784639596939087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,4,power_law_1.2,0.21717119216918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,4,power_law_1.2,0.298688006401062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,4,power_law_1.2,0.4571904182434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,4,power_law_1.2,0.5321983814239502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,4,power_law_1.2,0.9320192337036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,balanced,0.031871999303499855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,4,power_law_1.2,1.2458111763000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,4,power_law_1.2,1.696793556213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,balanced,0.058101331194241844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,4,power_law_1.2,2.180012893676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,balanced,0.06030400097370148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,4,power_law_1.2,2.1736896514892576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,balanced,0.05981333553791046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,balanced,0.06195199986298879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,4,power_law_1.2,4.55011215209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,balanced,0.06193066636721293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,balanced,0.033786666889985405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,balanced,0.06180266539255778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,4,power_law_1.2,7.116057586669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,balanced,0.03640533238649368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,balanced,0.0432533323764801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,balanced,0.06155733267466227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,balanced,0.06188266475995382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,balanced,0.046298667788505554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,balanced,0.06280000011126201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,balanced,0.04773333172003428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,balanced,0.06404800216356914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,balanced,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,balanced,0.04911466439565023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,balanced,0.06378666559855144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,balanced,0.04945066571235657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,balanced,0.05050666630268097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,balanced,0.06516266862551372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.01,0.04037759900093078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,balanced,0.050383999943733215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,balanced,0.026650667190551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,balanced,0.07178666690985362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,balanced,0.051488002141316734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.01,0.04310399889945984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,balanced,0.0529013325770696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,balanced,0.07373866438865662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,balanced,0.028090665737787884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.01,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,balanced,0.05384000142415365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,balanced,0.03716800113519033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,balanced,0.07620800038178761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,balanced,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,balanced,0.06371200084686279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,balanced,0.0405973345041275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,balanced,0.09058133761088054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.01,0.05894399881362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,balanced,0.0661653329928716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,balanced,0.04105599969625473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,balanced,0.09314666191736858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,balanced,0.0766293356815974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.01,0.06047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,balanced,0.04211199780305227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.01,0.06113920211791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,balanced,0.08308800061543782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.01,0.061939197778701785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,balanced,0.12298666437466939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,balanced,0.04301866888999939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,balanced,0.10739200313886006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.01,0.06209920048713684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,balanced,0.11760532855987549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,balanced,0.042965332667032875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,balanced,0.13131733735402426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.01,0.06249600052833557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,balanced,0.1718453367551168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.01,0.06435199975967407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,balanced,0.19689599672953287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.01,0.06520320177078247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,balanced,0.21124267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,balanced,0.04534933467706045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.01,0.06744959950447083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,balanced,0.2184000015258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,balanced,0.30190932750701904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,balanced,0.0458133320013682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.01,0.07744640111923218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.01,0.09147520065307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,balanced,0.3121653397878011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.01,0.035411199927330016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,balanced,0.39284801483154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.01,0.08951039910316468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.01,0.03562879860401154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.01,0.09688320159912109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,balanced,0.40442665417989093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,balanced,0.5632746616999308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.01,0.035104000568389894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.01,0.12370560169219971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.01,0.042310398817062375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.01,0.14087040424346925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,balanced,0.5869706471761068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,balanced,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.01,0.04387199878692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.01,0.18145279884338378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,balanced,0.706063985824585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,balanced,0.048528000712394714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.01,0.0473471999168396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.01,0.20211200714111327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.01,0.04827519953250885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.01,0.27112319469451907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,balanced,0.04979733129342397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,balanced,0.7371253172556559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,balanced,0.8726239999135336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.01,0.32652161121368406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.01,0.049344000220298764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,balanced,0.051301335295041404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.01,0.4029695987701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.01,0.04814079999923706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.01,0.5470335960388184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.01,0.05325440168380737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,balanced,0.9425333340962728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.01,0.05220479965209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.01,0.9384639739990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,power_law_1.01,0.028812798857688903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,balanced,0.0598826656738917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,balanced,1.376405398050944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.01,0.05441920161247253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.01,1.1539903640747071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,balanced,0.0612960010766983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,power_law_1.01,0.028934401273727418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.01,0.05576320290565491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,power_law_1.01,0.02993920147418976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,balanced,0.06562666594982147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.01,1.4809023857116699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,power_law_1.01,0.03957119882106781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.01,0.06088320016860962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,power_law_1.01,0.04017919898033142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,balanced,1.429850737253825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.01,2.4859136581420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,2,power_law_1.2,0.0406464010477066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,power_law_1.01,0.044268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.01,0.06945919990539551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,power_law_1.01,0.04519039988517761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,2,power_law_1.2,0.039577600359916684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.01,4.343225479125977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.01,0.07241600155830383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,power_law_1.01,0.04599680006504059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,balanced,0.08098133405049641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,2,power_law_1.2,0.04618239998817444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.01,0.07752320170402527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,power_law_1.01,0.048511999845504764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,balanced,0.08833066622416179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,2,power_law_1.2,0.05979520082473755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,power_law_1.01,0.04979200065135956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.01,0.09359999895095825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,balanced,2.6757707595825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,2,power_law_1.2,0.05731840133666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.01,0.11037440299987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,2,power_law_1.2,0.061740797758102414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.01,0.13550080060958863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,power_law_1.01,0.0551360011100769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,2,power_law_1.2,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,balanced,0.11983467141787212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.01,0.15079679489135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,balanced,2.7726561228434243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,power_law_1.01,0.055027198791503903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,2,power_law_1.2,0.06343039870262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,balanced,0.14662933349609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.01,0.20824320316314698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,power_law_1.01,0.056652802228927615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,power_law_1.01,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,2,power_law_1.2,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.01,0.2576256036758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,balanced,0.22297066450119019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,2,power_law_1.2,0.06330879926681518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.01,0.3935744047164917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,power_law_1.01,0.06970880031585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,balanced,0.2924213409423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,2,power_law_1.2,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,power_law_1.01,0.07501440048217774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.01,0.5517824172973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,balanced,0.4272853136062622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,2,power_law_1.2,0.06675840020179749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,power_law_1.01,0.07869439721107482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.01,0.7568895816802979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,2,power_law_1.2,0.0666815996170044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.01,0.9089280128479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,balanced,0.5686666568120321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,power_law_1.01,0.1106112003326416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,2,power_law_1.2,0.0778432011604309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,power_law_1.01,0.12353279590606689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.01,1.0468544006347655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,2,power_law_1.2,0.09207040071487427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.01,2.225382423400879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,2,power_law_1.2,0.09651200175285339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,power_law_1.01,0.1796223998069763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,power_law_1.01,0.21978240013122557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,2,power_law_1.2,0.0988864004611969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.01,3.9189502716064455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,power_law_1.01,0.33103361129760744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,power_law_1.01,0.3899904012680054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,2,power_law_1.2,0.12013440132141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,balanced,0.8643093109130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,power_law_1.01,0.6417215824127197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,2,power_law_1.2,0.13984639644622804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,power_law_1.01,0.9267007827758789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,2,power_law_1.2,0.1745151996612549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,2,power_law_1.2,0.035046398639678955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,balanced,1.123306671778361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,power_law_1.01,1.168064022064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,2,power_law_1.2,0.19854079484939574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,power_law_1.01,1.5263808250427247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,2,power_law_1.2,0.03495680093765259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,2,power_law_1.2,0.25483520030975343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,power_law_1.01,1.8980415344238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,2,power_law_1.2,0.03654400110244751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,2,power_law_1.2,0.359878396987915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,balanced,1.390442689259847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,power_law_1.01,3.7174846649169924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,2,power_law_1.2,0.0420415997505188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,2,power_law_1.2,0.45985918045043944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,2,power_law_1.2,0.0438975989818573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,power_law_1.01,6.103635025024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,2,power_law_1.2,0.5527040004730225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,2,power_law_1.2,0.047628799080848695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,2,power_law_1.2,0.7635136127471924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,2,power_law_1.2,0.04888960123062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,balanced,2.2233972549438477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,2,power_law_1.2,0.04922240078449249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,2,power_law_1.2,1.2003968238830567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,2,power_law_1.2,0.051667201519012454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,2,power_law_1.2,1.6510591506958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,2,power_law_1.2,0.053574401140213015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,2,power_law_1.2,2.231520080566406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,2,power_law_1.2,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,2,power_law_1.2,0.05800319910049438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,2,power_law_1.2,4.927942276000977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,2,power_law_1.2,0.060147202014923094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,2,power_law_1.2,0.061952000856399535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,2,power_law_1.2,0.0692351996898651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,balanced,4.4005387624104815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,2,power_law_1.2,0.07461119890213012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,2,power_law_1.2,0.08428159952163697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,2,power_law_1.2,0.09548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,2,power_law_1.2,0.1136896014213562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,2,power_law_1.2,0.142086398601532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,2,power_law_1.2,0.16164480447769164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,2,power_law_1.2,0.20959360599517823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,2,power_law_1.2,0.2890624046325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,2,power_law_1.2,0.4358719825744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,2,power_law_1.2,0.5521152019500732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,2,power_law_1.2,0.706879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,2,power_law_1.2,1.0245823860168457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,2,power_law_1.2,1.22161922454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,2,power_law_1.2,2.107980728149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,2,power_law_1.2,4.124531173706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,2,power_law_1.2,0.028089600801467895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,balanced,0.0306986669699351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,2,power_law_1.2,0.029548799991607665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,balanced,0.04064533362785975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,2,power_law_1.2,0.029311999678611755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,balanced,0.05343999962011973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,2,power_law_1.2,0.03557760119438171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,balanced,0.05629333357016245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,2,power_law_1.2,0.03866240084171295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,2,power_law_1.2,0.043532800674438474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,balanced,0.06108800073464712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,balanced,0.033941333492596946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,2,power_law_1.2,0.04391680061817169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,balanced,0.05792533357938131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,2,power_law_1.2,0.046623998880386354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,balanced,0.03557866563399633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,balanced,0.058821335434913635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,balanced,0.04504533112049103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,2,power_law_1.2,0.04837760031223297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,balanced,0.06196799874305725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,balanced,0.048341333866119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,2,power_law_1.2,0.051046401262283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,balanced,0.06224533418814341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,balanced,0.048026666045188904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,balanced,0.0628959983587265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,balanced,0.04957866668701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,balanced,0.06425599753856659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,2,power_law_1.2,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,balanced,0.050383999943733215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,balanced,0.06642666459083557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,2,power_law_1.2,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,2,power_law_1.2,0.056441599130630495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,balanced,0.04937066634496053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,balanced,0.06688533226648967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,2,power_law_1.2,0.0625216007232666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,balanced,0.050000001986821495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,balanced,0.069541335105896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,balanced,0.08482666810353597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,balanced,0.05134400228659312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,2,power_law_1.2,0.07318400144577027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,balanced,0.08140799899895985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,balanced,0.05186133086681366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,2,power_law_1.2,0.07457280158996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,2,power_law_1.2,0.09038720130920411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,balanced,0.08398399750391643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,balanced,0.05474133292833964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,balanced,0.056464001536369324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,balanced,0.10269866387049358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,2,power_law_1.2,0.10695040225982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,balanced,0.10626133282979329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,balanced,0.05809600154558817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,2,power_law_1.2,0.13815679550170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,balanced,0.14178666472434998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,balanced,0.06764266888300578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.03390080034732819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,2,power_law_1.2,0.1919360041618347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,balanced,0.06771733363469441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,balanced,0.1612266699473063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.03844479918479919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,2,power_law_1.2,0.25236480236053466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,balanced,0.07202133536338806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.039468801021575926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,2,power_law_1.2,0.32023038864135744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,balanced,0.23452800512313843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,balanced,0.08906666437784831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.053337597846984865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,2,power_law_1.2,0.4626431941986084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.0611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,balanced,0.09524266918500264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,balanced,0.2857653299967448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,2,power_law_1.2,0.6687615871429443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.05804160237312317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,balanced,0.1239359974861145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,2,power_law_1.2,0.9308032035827637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,balanced,0.4060853322347005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,balanced,0.1450826625029246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.06267520189285278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,balanced,0.029285334050655365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.06446719765663148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,2,power_law_1.2,1.288377571105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,balanced,0.20734934012095133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,balanced,0.5249653259913126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,balanced,0.03881600002447764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.06528639793395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,2,power_law_1.2,1.8570175170898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.06727039813995361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,balanced,0.04271466533342997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,balanced,0.2706773281097412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.06755840182304382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,2,power_law_1.2,2.285772705078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,balanced,0.04273599882920583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,balanced,0.76418670018514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.0692031979560852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,balanced,0.04472533365090688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,balanced,0.40163731575012207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.07808640003204345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,2,power_law_1.2,3.7823040008544924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,balanced,0.04572799801826477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.08389120101928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,balanced,0.5278026660283407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,balanced,0.04567466676235199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,2,power_law_1.2,7.012076568603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,balanced,0.9712959925333658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.09045760035514831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.0945792019367218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.01,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.12083200216293336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,balanced,0.7698293526967367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,balanced,0.0487413356701533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.1198591947555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,balanced,1.2087360223134358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,balanced,0.04969066878159841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.01,0.043859198689460754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,power_law_1.01,0.02781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.1590783953666687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.01,0.043315199017524716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,balanced,0.9409920374552408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.18429440259933472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.01,0.049004799127578734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,power_law_1.01,0.029555198550224305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.25136001110076905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.01,0.049516800045967105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,power_law_1.01,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.30422399044036863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.01,0.049267199635505673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,balanced,1.9694719314575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,power_law_1.01,0.03902080059051514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,balanced,0.052469333012898765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,balanced,1.1725813547770183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.01,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.4106880187988281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,power_law_1.01,0.044038400053977966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,balanced,0.054714664816856384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.01,0.050432002544403075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.5297088146209716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,balanced,0.05782933533191681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,power_law_1.01,0.045491200685501096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.01,0.05308160185813904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.01,0.7705984115600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,balanced,0.05956799785296122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,power_law_1.01,0.047353601455688475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.01,0.05588480234146118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.01,1.0397631645202636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.01,0.056678402423858645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,balanced,1.89956267674764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.01,1.254099178314209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,power_law_1.01,0.048281601071357726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.01,0.06172800064086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.01,2.0236160278320314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,balanced,0.07252799967924754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.01,0.07058560252189636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,power_law_1.01,0.05007359981536865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,balanced,3.810858726501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,balanced,0.07550399998823802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.01,0.07623040080070495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.01,3.6000446319580077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.01,0.07709439992904663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,balanced,0.08165333171685536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,power_law_1.01,0.057196801900863646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.01,0.0979968011379242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,power_law_1.01,0.0597760021686554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.01,0.10584959983825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,power_law_1.01,0.06152960062026978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.01,0.1343616008758545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,balanced,0.10748266180356343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,power_law_1.01,0.06668800115585327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.01,0.15805439949035643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,balanced,3.835269292195638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.01,0.21948800086975098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.03196159899234772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,balanced,0.12099732955296834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,power_law_1.01,0.07834240198135375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.01,0.26890881061553956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,power_law_1.01,0.08268160223960877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.01,0.39543039798736573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,power_law_1.01,0.09095680117607116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.01,0.5210432052612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,balanced,0.19006399313608804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,power_law_1.01,0.11509120464324951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.06096000075340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.01,0.7476863861083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,balanced,0.24543466170628866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.01,0.13506560325622557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.058905601501464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.01,0.9767999649047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,balanced,0.3546239932378133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.01,0.2001215934753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.06146559715270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.01,1.1986175537109376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.01,0.2585344076156616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.0642304003238678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,balanced,0.4620586633682251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.01,0.36909439563751223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.01,1.9042943954467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.06478080153465271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.01,0.4758463859558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,balanced,0.6781493028004965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.01,0.6909696102142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.06509439945220948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.01,3.6350975036621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.01,0.8936832427978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.0675711989402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.01,1.3270463943481445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,balanced,0.8892373243967692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.0686784029006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.01,1.7517248153686524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.06967039704322815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.01,2.182099151611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,balanced,1.3320266405741374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,power_law_1.01,3.4595710754394533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.07675520181655884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.08320000171661376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,power_law_1.01,6.851705932617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,balanced,1.757893403371175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.09103999733924865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.089683198928833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.11363199949264527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,balanced,2.1834346453348794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.12332799434661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.15763200521469117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.1807360053062439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.2526335954666138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,balanced,3.47380797068278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.28732800483703613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.4147071838378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.5407360076904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,1,power_law_1.2,0.7734655857086181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,1,power_law_1.2,1.0133567810058595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,1,power_law_1.2,1.2812095642089845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,1,power_law_1.2,1.999718475341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,balanced,6.86634635925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,1,power_law_1.2,3.639206314086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.033228799700737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.0435263991355896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.04460160136222839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.049497601389884946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.05008000135421753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.05061759948730469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.050195199251174924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.053548800945281985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.055641597509384154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.05687040090560913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.063372802734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.07077119946479797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.07429760098457336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.07728000283241272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.10091520547866821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.10526080131530761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.13794560432434083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.1607103943824768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,balanced,0.0916426678498586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.22076799869537353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,balanced,0.07902400195598602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.2774143934249878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,balanced,0.0787360022465388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.39415678977966306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,balanced,0.08161599934101105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,0.5157887935638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,1,power_law_1.2,0.027968001365661622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,balanced,0.08460799853006999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,0.7504831790924072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,1,power_law_1.2,0.0286080002784729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,balanced,0.08433066805203755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,0.98155517578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,balanced,0.08328533172607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,1,power_law_1.2,0.03025279939174652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,balanced,0.05594133337338766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,1,power_law_1.2,1.2032832145690917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,balanced,0.08614933490753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,1,power_law_1.2,1.9258560180664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,1,power_law_1.2,0.039955198764801025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,balanced,0.059578667084376015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,balanced,0.08358400066693623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,1,power_law_1.2,0.04158720076084137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,1,power_law_1.2,3.6245185852050783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,balanced,0.05739733576774597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,balanced,0.08424533406893413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,1,power_law_1.2,0.04420480132102966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,balanced,0.06057066718737284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,balanced,0.08851733803749084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,1,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,balanced,0.06038933495680491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,balanced,0.08737066388130188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,1,power_law_1.2,0.047679999470710756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,balanced,0.061237335205078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,balanced,0.08620799581209819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,balanced,0.08678932984670003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,balanced,0.06282666822274525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,1,power_law_1.2,0.04865919947624207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,balanced,0.1099679966767629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,balanced,0.06267733375231425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,1,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,balanced,0.10992532968521118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,balanced,0.06079466640949249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,balanced,0.09918399651845296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,balanced,0.06316799918810527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,balanced,0.12461866935094197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,balanced,0.06427200138568878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,1,power_law_1.2,0.057043200731277464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,balanced,0.12204800049463908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,balanced,0.0628959983587265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,1,power_law_1.2,0.05983359813690185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,balanced,0.19182399908701578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,balanced,0.06444799900054932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,1,power_law_1.2,0.06119679808616638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,balanced,0.06577066580454509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,balanced,0.1528320014476776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,balanced,0.07805866499741872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,1,power_law_1.2,0.06699519753456115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,balanced,0.053957333167394005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.01,0.09038720130920411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,balanced,0.26321067412694293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,balanced,0.07884799937407176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,1,power_law_1.2,0.0779583990573883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,balanced,0.07853866616884868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.01,0.07857919931411743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,balanced,0.26708799600601196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,balanced,0.04950400193532308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,1,power_law_1.2,0.08225280046463013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,balanced,0.049786667029062905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.01,0.07998080253601074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,balanced,0.0943946639696757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,balanced,0.05303466816743215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,1,power_law_1.2,0.09178239703178406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,balanced,0.3842879931131999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,balanced,0.09508267045021057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.01,0.0828224003314972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,balanced,0.05342400074005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,balanced,0.05399466554323832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,balanced,0.1426293353239695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,1,power_law_1.2,0.1167680025100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.01,0.08183040022850037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,balanced,0.4952640136082967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,balanced,0.05514666438102722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.01,0.08520320057868958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.2,0.13645440340042114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,balanced,0.14698666334152222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,balanced,0.05445333321889242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.01,0.09008640050888062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,balanced,0.058415999015172325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,balanced,0.7466506958007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,balanced,0.22184000412623087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,balanced,0.05903466542561849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.2,0.1997696042060852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.01,0.08737279772758484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.01,0.10020480155944825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.2,0.25896320343017576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,balanced,0.2233333388964335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,balanced,0.9313013553619385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.2,0.3678143978118896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.01,0.10610560178756714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,balanced,0.3185759981473287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.2,0.475980806350708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.01,0.09286400079727172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.2,0.6931968212127686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.01,0.0990015983581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,balanced,0.4010719855626424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,balanced,1.2073226769765217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.2,0.8969535827636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.01,0.11016319990158081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,balanced,0.05885866781075796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.01,0.05651199817657471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.2,1.331167984008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.01,0.1227455973625183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,balanced,0.06052266558011373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.01,0.05898879766464234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,balanced,0.5899786551793417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.2,1.7531967163085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.01,0.16824320554733277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,balanced,0.05962666869163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.01,0.05486720204353333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.01,0.18557440042495726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.2,2.1866943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,power_law_1.01,0.052716797590255736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.01,0.05927039980888367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,balanced,1.8418933550516765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.01,0.19756799936294556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.01,0.05859839916229248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,1,power_law_1.2,3.468159866333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,balanced,0.769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,power_law_1.01,0.04891520142555237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.01,0.06064000129699707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.01,0.32425599098205565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.01,0.07041919827461243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,power_law_1.01,0.04924800097942352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.01,0.31614079475402834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,1,power_law_1.2,6.867289733886719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.01,0.06376960277557372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,power_law_1.01,0.05203840136528015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,balanced,0.06805866460005443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.01,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,power_law_1.01,0.05275520086288452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,balanced,0.9720533688863119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.01,0.4654528141021729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.01,0.06578559875488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,balanced,0.06878399848937988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,power_law_1.01,0.057062399387359616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.01,0.06611199975013733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.01,0.43724799156188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,balanced,0.07070399820804596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,power_law_1.01,0.06364160180091857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.01,0.07538560032844543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.01,0.07877119779586791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.01,0.5277503967285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,balanced,3.5826187133789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.01,0.08692479729652405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,power_law_1.01,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.01,0.11407359838485717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,balanced,1.502618630727132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.01,0.8328639984130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.01,0.1192512035369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,power_law_1.01,0.0778432011604309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.01,0.13408000469207765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.01,1.2644864082336427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,power_law_1.01,0.08887040019035339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.01,0.17804160118103027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.01,1.336672019958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.01,0.2018496036529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,balanced,0.0836906631787618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.01,0.27150719165802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.01,2.475833511352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.01,0.3901632070541382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,balanced,0.08774933218955994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,power_law_1.01,0.06821759939193725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.01,0.5409279823303222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.01,2.978816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.01,0.5230016231536865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,power_law_1.01,0.07593600153923034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.01,0.69552640914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.01,3.8825023651123045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,power_law_1.01,0.07969279885292054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.01,1.0600255966186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,balanced,2.937840143839518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,power_law_1.01,0.09889280200004577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.01,6.386572647094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.01,1.5582271575927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.01,2.2251712799072267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,balanced,0.11950400471687317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.01,12.44949722290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.01,2.8836992263793944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,balanced,0.13966400424639383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,power_law_1.01,0.10643199682235718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.01,3.8158912658691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,power_law_1.01,0.12076799869537354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,balanced,0.1983413298924764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,power_law_1.01,0.13688960075378417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.01,8.033612823486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,balanced,0.2291839917500814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,power_law_1.01,0.17048959732055663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,4,8,power_law_1.2,0.07904639840126038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,power_law_1.01,0.21036159992218018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,4,8,power_law_1.2,0.07874559760093688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,balanced,0.3451840082804362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,4,8,power_law_1.2,0.07930880188941955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,4,8,power_law_1.2,0.08303359746932984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,balanced,0.46074668566385907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,power_law_1.01,0.349452805519104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,4,8,power_law_1.2,0.08165119886398316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,power_law_1.01,0.37792000770568845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,4,8,power_law_1.2,0.0864960014820099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,balanced,0.7004160086313883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,power_law_1.01,0.7197375774383545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,4,8,power_law_1.2,0.0901632010936737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,4,8,power_law_1.2,0.08755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,power_law_1.01,0.8413567543029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,balanced,0.917242685953776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,4,8,power_law_1.2,0.10497280359268188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,power_law_1.01,1.3376704216003419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,4,8,power_law_1.2,0.10022399425506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,power_law_1.01,1.5858752250671386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,balanced,1.1430559953053792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,4,8,power_law_1.2,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,power_law_1.01,2.3227712631225588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,4,8,power_law_1.2,0.11822719573974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,4,8,power_law_1.2,0.11442559957504272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,power_law_1.01,3.1183551788330077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,4,8,power_law_1.2,0.13184640407562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,power_law_1.01,4.136179351806641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,balanced,1.8025867144266765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,4,8,power_law_1.2,0.16967040300369263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,power_law_1.01,6.167552185058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,4,8,power_law_1.2,0.1581055998802185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,4,8,power_law_1.2,0.20476799011230468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,power_law_1.01,12.906719970703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,4,8,power_law_1.2,0.29115519523620603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,4,8,power_law_1.2,0.3344448089599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,4,8,power_law_1.2,0.4653439998626709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,balanced,3.541520118713379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,4,8,power_law_1.2,0.42731518745422364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,4,8,power_law_1.2,0.5932415962219239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,4,8,power_law_1.2,0.8144831657409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,4,8,power_law_1.2,1.1835712432861327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,4,8,power_law_1.2,1.5513216018676759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,4,8,power_law_1.2,2.1386240005493162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,4,8,power_law_1.2,3.275910568237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,4,8,power_law_1.2,4.084083175659179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,4,8,power_law_1.2,5.639769744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,4,8,power_law_1.2,12.59810562133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,4,8,power_law_1.2,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,4,8,power_law_1.2,0.05920640230178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,4,8,power_law_1.2,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,4,8,power_law_1.2,0.05883520245552063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,4,8,power_law_1.2,0.0587007999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,4,8,power_law_1.2,0.06110079884529114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,4,8,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,4,8,power_law_1.2,0.06416640281677247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,4,8,power_law_1.2,0.06568959951400757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,4,8,power_law_1.2,0.07206400036811829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,4,8,power_law_1.2,0.06766719818115234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,4,8,power_law_1.2,0.07351679801940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,4,8,power_law_1.2,0.0761023998260498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,4,8,power_law_1.2,0.08856959939002991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,4,8,power_law_1.2,0.0486272007226944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,4,8,power_law_1.2,0.09818879961967468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,4,8,power_law_1.2,0.11914240121841431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,4,8,power_law_1.2,0.04848639965057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,4,8,power_law_1.2,0.12583039999008178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,4,8,power_law_1.2,0.04911360144615173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,4,8,power_law_1.2,0.18802560567855836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,balanced,0.05912533402442932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,4,8,power_law_1.2,0.05286399722099304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,4,8,power_law_1.2,0.18645119667053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,balanced,0.055258666475613914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,4,8,power_law_1.2,0.053011202812194826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,4,8,power_law_1.2,0.27657599449157716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,balanced,0.04462933540344238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,4,8,power_law_1.2,0.3903872013092041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,balanced,0.08175999919573466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,4,8,power_law_1.2,0.05731840133666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,balanced,0.04407466451327006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,4,8,power_law_1.2,0.5507199764251709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,balanced,0.08436266581217448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,4,8,power_law_1.2,0.06969599723815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,4,8,power_law_1.2,0.5539455890655518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,4,8,power_law_1.2,0.8153152465820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,4,8,power_law_1.2,0.07214720249176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,balanced,0.08488000432650249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,balanced,0.0595413347085317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,4,8,power_law_1.2,1.1111231803894044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,4,8,power_law_1.2,0.0796288013458252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,balanced,0.08517866333325703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,4,8,power_law_1.2,1.6847488403320312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,balanced,0.059008002281188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,4,8,power_law_1.2,0.09441919922828675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,balanced,0.08586666981379192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,4,8,power_law_1.2,2.2820287704467774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,balanced,0.06052800019582113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,balanced,0.08674666285514832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,4,8,power_law_1.2,2.880588722229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,balanced,0.06195733447869619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,balanced,0.08397333820660909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,4,8,power_law_1.2,3.765036773681641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,4,8,power_law_1.2,0.06954240202903747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,balanced,0.06144533554712931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,balanced,0.08576533198356628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,4,8,power_law_1.2,0.07790719866752624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,4,8,power_law_1.2,7.703788757324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,balanced,0.06292266647020976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,balanced,0.08924800157546997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,4,8,power_law_1.2,0.0873856008052826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,balanced,0.03524799893299738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,balanced,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,balanced,0.0860053300857544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,4,8,power_law_1.2,0.10045440196990967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,balanced,0.04926399886608124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,balanced,0.0631573349237442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,balanced,0.08616000413894653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,balanced,0.052832002441088356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,balanced,0.06548800071080525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,balanced,0.08799466490745544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,balanced,0.052570665876070656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,balanced,0.06740800042947133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,balanced,0.10151466727256775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,4,8,power_law_1.2,0.11582080125808716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,balanced,0.05384000142415365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,balanced,0.07635733485221863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,balanced,0.10169066985448201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,4,8,power_law_1.2,0.12188160419464111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,balanced,0.05518933137257894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,balanced,0.10276266932487488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,balanced,0.07718933125336964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,4,8,power_law_1.2,0.1568511962890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,balanced,0.05443733433882395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,balanced,0.08122666676839192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,balanced,0.12147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,balanced,0.09382399916648865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,balanced,0.13244266311327615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,4,8,power_law_1.2,0.17781120538711548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,balanced,0.10019200046857198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,balanced,0.1646986703077952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,balanced,0.05612266560395559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,4,8,power_law_1.2,0.2374336004257202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,balanced,0.05699733396371206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.01,0.06601600050926208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,balanced,0.137061337629954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,balanced,0.20189332962036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,balanced,0.15566399693489075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.01,0.06988160014152527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,balanced,0.2644266684850057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,balanced,0.21493866046269736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.01,0.07420160174369812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,4,8,power_law_1.2,0.38775680065155027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,balanced,0.3094720045725505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,4,8,power_law_1.2,0.4656064033508301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.01,0.08301439881324768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,balanced,0.25920534133911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,balanced,0.4378933509190877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,4,8,power_law_1.2,0.7403391838073731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.01,0.08362240195274354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,balanced,0.05774400134881338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,balanced,0.3667200009028117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,4,8,power_law_1.2,0.887116813659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.01,0.08472319841384887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,balanced,0.5088106791178385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,balanced,0.058821335434913635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.01,0.0876800000667572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,balanced,0.4463520050048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,balanced,0.06083733340104421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,4,8,power_law_1.2,1.3107328414916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.01,0.05307520031929016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,balanced,0.061343997716903687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,balanced,0.7451093196868896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.01,0.08866559863090515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,4,8,power_law_1.2,1.7319232940673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.01,0.054662400484085084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.01,0.08805760145187377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,balanced,0.6483733256657919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.01,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,4,8,power_law_1.2,2.5350528717041017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.01,0.08885759711265565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.01,0.05857920050621033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,balanced,0.9844426314036051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,4,8,power_law_1.2,3.2169216156005858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.01,0.058841598033905027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.01,0.099891197681427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.01,0.06135680079460144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,balanced,0.837013324101766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.01,0.10247039794921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,4,8,power_law_1.2,4.111315155029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.01,0.06113280057907104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.01,0.06321280002593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.01,0.10302720069885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,balanced,0.07009600102901459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,balanced,1.2321013609568279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,4,8,power_law_1.2,6.7797119140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.01,0.06494719982147217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.01,0.1152448058128357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,balanced,0.07214933137098949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.01,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,balanced,1.0345439910888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.01,0.13173120021820067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.01,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,balanced,0.07413866619269054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,4,8,power_law_1.2,13.593344116210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.01,0.07269759774208069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.01,0.14657280445098878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,balanced,0.09124267101287842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.01,0.07269120216369629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.01,0.1463744044303894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,balanced,1.9076746304829915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,balanced,0.09873066345850627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.01,0.08602880239486695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.01,0.19713280200958253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.01,0.09177600145339966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.01,0.22040960788726807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.01,0.10682879686355591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,balanced,1.6503520011901855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.01,0.10682239532470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.01,0.26968960762023925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.01,0.13137279748916625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,balanced,0.1322986682256063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.01,0.40087041854858396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.01,0.16661759614944457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.01,0.2695103883743286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,balanced,0.15941866238911948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.01,0.5693503856658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.01,0.22376959323883056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.01,0.6375679969787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.01,0.4074560165405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.01,0.49334402084350587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.01,1.1016832351684571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,balanced,3.7554985682169595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.01,0.6350656032562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.01,1.0051456451416017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.01,0.8015551567077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,balanced,0.23426665862401327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,power_law_1.01,0.04046080112457275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.01,1.353222370147705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.01,2.0254655838012696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,balanced,3.182170550028483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.01,1.8199871063232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,power_law_1.01,0.04337919950485229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,balanced,0.30962133407592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.01,2.4958463668823243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.01,2.4037120819091795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,power_law_1.01,0.052172797918319705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.01,3.5674816131591798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,power_law_1.01,0.050470399856567386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.01,4.042150497436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,balanced,0.46482666333516437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,power_law_1.01,0.05780479907989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.01,7.319904327392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.01,4.600812911987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,power_law_1.01,0.057107198238372806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,balanced,0.6133173306783041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,power_law_1.01,0.06808320283889771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.01,10.088140869140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,balanced,0.9187306563059489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,power_law_1.01,0.06788480281829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,power_law_1.01,0.070387202501297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,balanced,1.2161119778951008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,power_law_1.01,0.06849279999732971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,power_law_1.01,0.07245439887046815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,balanced,1.5314879417419434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,power_law_1.01,0.07708160281181335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,power_law_1.01,0.08755840063095092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,4,power_law_1.2,0.07088000178337098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,balanced,2.4298879305521646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,power_law_1.01,0.09160959720611572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,4,power_law_1.2,0.07514879703521729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,4,power_law_1.2,0.06947839856147767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,power_law_1.01,0.10588799715042115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,4,power_law_1.2,0.08346880078315735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,4,power_law_1.2,0.08306559920310974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,power_law_1.01,0.12370560169219971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,4,power_law_1.2,0.08478080034255982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,power_law_1.01,0.15411839485168458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,4,power_law_1.2,0.09057279825210571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,power_law_1.01,0.19729280471801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,4,power_law_1.2,0.08786560297012329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,4,power_law_1.2,0.09434880018234253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,power_law_1.01,0.2689471960067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,4,power_law_1.2,0.09201920032501221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,4,power_law_1.2,0.09818239808082581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,power_law_1.01,0.36750719547271726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,balanced,4.835935910542806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,4,power_law_1.2,0.10581760406494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,4,power_law_1.2,0.105132794380188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,power_law_1.01,0.5029248237609864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,4,power_law_1.2,0.12538880109786987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,power_law_1.01,0.8361023902893067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,4,power_law_1.2,0.14039679765701293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,4,power_law_1.2,0.14926079511642457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,power_law_1.01,0.9733951568603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,4,power_law_1.2,0.16785919666290283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,power_law_1.01,1.4166975975036622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,4,power_law_1.2,0.19777920246124267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,4,power_law_1.2,0.22984960079193115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,power_law_1.01,2.6231103897094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,4,power_law_1.2,0.2911231994628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,power_law_1.01,3.1303552627563476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,4,power_law_1.2,0.42958722114562986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,power_law_1.01,3.8502079010009767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,4,power_law_1.2,0.6006656169891358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,4,power_law_1.2,0.6955071926116944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,power_law_1.01,6.939174652099609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,4,power_law_1.2,0.9954879760742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,4,power_law_1.2,1.3958911895751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,power_law_1.01,10.582745361328126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,4,power_law_1.2,1.6419456481933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,4,power_law_1.2,3.4507774353027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,4,power_law_1.2,3.3214527130126954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,4,power_law_1.2,5.5534015655517575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,4,power_law_1.2,11.596633911132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,4,power_law_1.2,0.052825599908828735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,4,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,4,power_law_1.2,0.051686400175094606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,4,power_law_1.2,0.05737599730491638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,4,power_law_1.2,0.057817602157592775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,4,power_law_1.2,0.06048640012741089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,4,power_law_1.2,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,4,power_law_1.2,0.06314880251884461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,4,power_law_1.2,0.06297600269317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,4,power_law_1.2,0.0656000018119812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,4,power_law_1.2,0.06896640062332153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,4,power_law_1.2,0.07251840233802795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,4,power_law_1.2,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,4,power_law_1.2,0.04990079998970032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,4,power_law_1.2,0.08388479948043823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,4,power_law_1.2,0.041094401478767396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,4,power_law_1.2,0.09515519738197327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,4,power_law_1.2,0.04930559992790222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,4,power_law_1.2,0.10648319721221924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,balanced,0.045408000548680626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,4,power_law_1.2,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,4,power_law_1.2,0.10432640314102173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,4,power_law_1.2,0.14813439846038817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,4,power_law_1.2,0.05265920162200928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,balanced,0.05505066613356272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,balanced,0.03664533297220866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,4,power_law_1.2,0.18180480003356933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,4,power_law_1.2,0.05616000294685364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,balanced,0.07829333345095317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,4,power_law_1.2,0.27578880786895754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,4,power_law_1.2,0.059443199634552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,balanced,0.04005333284536997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,balanced,0.05585599939028422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,4,power_law_1.2,0.06280959844589233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,4,power_law_1.2,0.2954495906829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,balanced,0.08260799944400787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,balanced,0.06017066538333893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,4,power_law_1.2,0.3669568061828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,balanced,0.0823466678460439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,4,power_law_1.2,0.06941440105438232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,4,power_law_1.2,0.5377600193023682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,balanced,0.05962666869163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,balanced,0.06084799766540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,4,power_law_1.2,0.7794816017150878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,balanced,0.08354666829109192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,4,power_law_1.2,0.06908800005912781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,balanced,0.06298133234182994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,balanced,0.08526399731636047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,4,power_law_1.2,0.9302463531494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,balanced,0.08472533027331035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,balanced,0.06230400005976359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,4,power_law_1.2,1.246572780609131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,balanced,0.08435733119646709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,4,power_law_1.2,0.06712960004806519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,balanced,0.061754668752352394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,balanced,0.08586133519808452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,4,power_law_1.2,1.762175941467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,balanced,0.06369066735108693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,4,power_law_1.2,0.0742143988609314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,balanced,0.08591467142105103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,balanced,0.06586133440335591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,4,power_law_1.2,0.07631999850273133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,4,power_law_1.2,2.628927993774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,balanced,0.08714666962623596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,balanced,0.065461332599322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,4,power_law_1.2,0.09076480269432068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,balanced,0.088319996992747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,4,power_law_1.2,4.17523193359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,balanced,0.06779199838638306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,balanced,0.09297600388526917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,4,power_law_1.2,7.012729644775391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,balanced,0.07130666573842366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,balanced,0.030026666820049286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,balanced,0.10338667035102844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,4,power_law_1.2,0.08942720293998718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,balanced,0.10300800204277039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,balanced,0.0778186668952306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,balanced,0.03366933266321818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,balanced,0.10796800255775452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,4,power_law_1.2,0.11236480474472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,balanced,0.0790826678276062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,balanced,0.049135997891426086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,balanced,0.1264639993508657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,4,power_law_1.2,0.12617599964141846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,balanced,0.08434666196505229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,balanced,0.05333333214124044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,balanced,0.1458239952723185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,4,power_law_1.2,0.1713152050971985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,balanced,0.1006773312886556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,balanced,0.05301866432030996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,4,power_law_1.2,0.226310396194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,balanced,0.05445333321889242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,balanced,0.17199466625849405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,balanced,0.11658666531244914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,balanced,0.055904000997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,balanced,0.21414399147033691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,balanced,0.14474667112032572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,balanced,0.05566399792830149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,4,power_law_1.2,0.34872961044311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,balanced,0.2897493243217468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.01,0.055180799961090085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,4,power_law_1.2,0.4637184143066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,balanced,0.16676799456278482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,balanced,0.3166933258374532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,balanced,0.23813333113988241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.01,0.050783997774124144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,balanced,0.05797866483529409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,4,power_law_1.2,0.540992021560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.01,0.05364480018615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,balanced,0.059263999263445534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,balanced,0.4633013407389323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,balanced,0.2871999939282735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,4,power_law_1.2,0.7444479942321778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.01,0.08293120265007019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,4,power_law_1.2,0.9651264190673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,balanced,0.41041600704193115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.01,0.08097280263900757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,balanced,0.6073066790898641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.01,0.08234879970550538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,4,power_law_1.2,1.6658496856689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,balanced,0.5300800005594889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.01,0.08313599824905396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,balanced,0.9029546578725179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,4,power_law_1.2,2.8519039154052734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.01,0.08355200290679932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,balanced,0.06021333237489065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,4,power_law_1.2,2.935379219055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.01,0.08591359853744507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,balanced,0.7622400124867758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,balanced,0.06294933458169301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,balanced,1.1546239852905273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,4,power_law_1.2,3.588959884643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.01,0.08701440095901489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,balanced,0.06487999856472015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.01,0.08693119883537292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,balanced,0.066021333138148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,4,power_law_1.2,6.908755493164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,balanced,1.0046559969584148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.01,0.09096320271492005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,balanced,1.4501439730326335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.01,0.09452160000801087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,4,power_law_1.2,12.796294403076171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.01,0.10618879795074462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.01,0.03966079950332642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,balanced,1.2521119912465413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.01,0.12116479873657227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.01,0.04509440064430237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.01,0.04533120095729828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.01,0.1283455967903137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.01,0.0590719997882843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,balanced,0.07727999985218048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.01,0.12762240171432496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,balanced,2.2242453893025718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.01,0.06001920104026794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,balanced,0.07955199976762135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.01,0.16552319526672363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,power_law_1.01,0.035231998562812804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.01,0.05875840187072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.01,0.062035202980041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,balanced,1.9812426567077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,balanced,0.08578667044639587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.01,0.16420480012893676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,power_law_1.01,0.03548159897327423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.01,0.061766397953033444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,balanced,0.10880000392595927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.01,0.23972480297088622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.01,0.06307200193405152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,power_law_1.01,0.038406398892402646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.01,0.06451839804649354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,balanced,0.11935466527938843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.01,0.2979712009429932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,power_law_1.01,0.053420799970626834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.01,0.06570879817008972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.01,0.3699903964996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.01,0.07312639951705932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,power_law_1.01,0.05364480018615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.01,0.07190399765968322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.01,0.46586241722106936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.01,0.0745024025440216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,power_law_1.01,0.0549888014793396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.01,0.08178560137748718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.01,0.7284287929534912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,balanced,4.339834531148274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,power_law_1.01,0.05885440111160278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.01,0.09463679790496826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.01,0.9012031555175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.01,0.10540159940719604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,balanced,4.075381278991699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,power_law_1.01,0.060224002599716185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.01,1.3141056060791017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,balanced,0.17568532625834146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.01,0.12287360429763794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.01,1.6823871612548829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.01,0.1276095986366272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,balanced,0.22690133253733316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.01,0.18165760040283202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.01,2.5374656677246095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,power_law_1.01,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.01,0.23244800567626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,balanced,0.3330933252970378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.01,3.280883026123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.01,0.3277631998062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,balanced,0.4347519874572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.01,0.3831615924835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.01,6.7306365966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.01,0.5515007972717285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,power_law_1.01,0.06970880031585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,balanced,0.6411946614583334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.01,0.696665620803833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,power_law_1.01,0.07330560088157653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.01,1.0336000442504882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,power_law_1.01,0.0750656008720398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,balanced,0.8511040210723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.01,1.3077312469482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,power_law_1.01,0.07953919768333435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.01,1.8312959671020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,balanced,1.2652426560719807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,power_law_1.01,0.0923904001712799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.01,2.6945152282714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,power_law_1.01,0.09322879910469055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.01,6.479987335205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,balanced,1.6839787165323894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,power_law_1.01,0.12414720058441162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,power_law_1.01,0.14988800287246704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,balanced,2.0978026390075684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,power_law_1.01,0.19693440198898315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,power_law_1.01,0.2838848114013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,power_law_1.01,0.3258687973022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,balanced,3.319792111714681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,power_law_1.01,0.5320256233215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,power_law_1.01,0.6701632022857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,2,power_law_1.2,0.052697598934173584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,power_law_1.01,0.9855104446411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,2,power_law_1.2,0.0515392005443573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,power_law_1.01,1.2551679611206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,2,power_law_1.2,0.05432959794998169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,2,power_law_1.2,0.0805184006690979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,power_law_1.01,1.8635456085205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,2,power_law_1.2,0.08022400140762329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,power_law_1.01,2.4863231658935545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,2,power_law_1.2,0.07991679906845092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,balanced,6.590917587280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,2,power_law_1.2,0.0828224003314972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,power_law_1.01,3.0155839920043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,2,power_law_1.2,0.08436480164527893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,2,power_law_1.2,0.08711040019989014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,power_law_1.01,5.315910339355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,2,power_law_1.2,0.088019198179245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,2,power_law_1.2,0.08819199800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,2,power_law_1.2,0.09063680171966552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,power_law_1.01,9.167430114746093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,2,power_law_1.2,0.09477760195732117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,2,power_law_1.2,0.10022399425506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,2,power_law_1.2,0.11866240501403809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,2,power_law_1.2,0.13033599853515626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,2,power_law_1.2,0.11771520376205444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,2,power_law_1.2,0.17059199810028075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,2,power_law_1.2,0.20371201038360595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,2,power_law_1.2,0.22037119865417482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,2,power_law_1.2,0.3154239892959595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,2,power_law_1.2,0.3842816114425659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,2,power_law_1.2,0.5100736141204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,2,power_law_1.2,0.7634496212005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,2,power_law_1.2,0.8788352012634277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,2,power_law_1.2,1.4156800270080567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,2,power_law_1.2,2.0824832916259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,2,power_law_1.2,2.301350402832031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,2,power_law_1.2,3.7538814544677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,2,power_law_1.2,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,2,power_law_1.2,8.25854721069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,2,power_law_1.2,0.04509440064430237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,2,power_law_1.2,0.04534400105476379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,2,power_law_1.2,0.05862399935722351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,2,power_law_1.2,0.05975679755210876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,2,power_law_1.2,0.0603007972240448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,2,power_law_1.2,0.0615231990814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,2,power_law_1.2,0.0624064028263092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,2,power_law_1.2,0.06377599835395813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,2,power_law_1.2,0.06396160125732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,balanced,0.05422399938106537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,2,power_law_1.2,0.06527360081672669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,2,power_law_1.2,0.07169920206069946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,balanced,0.055018668373425804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,2,power_law_1.2,0.07573760151863099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,balanced,0.08017600079377492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,2,power_law_1.2,0.08227840065956116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,2,power_law_1.2,0.036057600378990175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,balanced,0.08133333424727122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,2,power_law_1.2,0.09214720129966736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,2,power_law_1.2,0.03650560081005096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,2,power_law_1.2,0.09580159783363343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,balanced,0.08246933420499165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,2,power_law_1.2,0.10167039632797241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,2,power_law_1.2,0.03684479892253876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,2,power_law_1.2,0.12242560386657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,balanced,0.08410666386286418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,balanced,0.042853335539499916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,2,power_law_1.2,0.05204480290412903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,2,power_law_1.2,0.1258239984512329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,balanced,0.08427733182907104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,2,power_law_1.2,0.17203840017318725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,2,power_law_1.2,0.05374079942703247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,balanced,0.04058133314053217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,2,power_law_1.2,0.20873599052429198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,balanced,0.08536000053087871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,2,power_law_1.2,0.33194880485534667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,2,power_law_1.2,0.05557119846343994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,balanced,0.08584533135096233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,2,power_law_1.2,0.3752255916595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,2,power_law_1.2,0.057715201377868654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,2,power_law_1.2,0.5475391864776611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,balanced,0.08675733208656311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,balanced,0.05961066484451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,2,power_law_1.2,0.7978879928588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,2,power_law_1.2,0.06273279786109924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,balanced,0.09101866682370503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,2,power_law_1.2,1.1121536254882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,balanced,0.05958933134873708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,balanced,0.09240000446637471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,2,power_law_1.2,1.4840127944946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,balanced,0.06107733150323232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,2,power_law_1.2,0.06362239718437195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,2,power_law_1.2,2.0106815338134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,balanced,0.09238400061925252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,balanced,0.06258666515350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,2,power_law_1.2,0.06807039976119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,2,power_law_1.2,3.050815963745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,balanced,0.09918399651845296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,balanced,0.061568001906077065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,2,power_law_1.2,6.271475219726563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,balanced,0.10442666212717693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,balanced,0.06292266647020976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,2,power_law_1.2,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,balanced,0.10672000050544739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,balanced,0.11927466591199239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,2,power_law_1.2,0.0725055992603302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,balanced,0.06489066779613495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,balanced,0.13808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,2,power_law_1.2,0.0763647973537445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,balanced,0.032144000132878624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,balanced,0.06648533542950948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,2,power_law_1.2,0.08314239978790283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,balanced,0.1556426684061686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,balanced,0.03646933287382126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,balanced,0.06962666908899943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,balanced,0.19292799631754556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,balanced,0.05136000116666158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,balanced,0.07203199962774913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,balanced,0.054661333560943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,balanced,0.25979199012120563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,2,power_law_1.2,0.09256960153579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,balanced,0.07437866429487865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,balanced,0.055349335074424744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,2,power_law_1.2,0.10313600301742554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,balanced,0.3516480127970378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,balanced,0.05705599983533224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,balanced,0.08386133114496867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,2,power_law_1.2,0.11984000205993653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,balanced,0.06028266747792562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,balanced,0.08539199829101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,balanced,0.44650665918986004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,2,power_law_1.2,0.14696320295333862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,balanced,0.05951466659704844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,2,power_law_1.2,0.19467519521713256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,balanced,0.09830400347709656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.055103999376296994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,balanced,0.6299253304799398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,balanced,0.1156213382879893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.047302401065826415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,balanced,0.0617439995209376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,balanced,0.1295093297958374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,balanced,0.7413547039031982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,2,power_law_1.2,0.29146881103515626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.053337597846984865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,balanced,0.16591999928156534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,balanced,0.06379200021425883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,2,power_law_1.2,0.3759615898132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.08091520071029663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,balanced,0.2174826661745707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,2,power_law_1.2,0.4972991943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,balanced,1.1007786591847737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.07872639894485474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,2,power_law_1.2,0.6700223922729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,balanced,0.3099199930826823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.08305919766426087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,2,power_law_1.2,1.1257856369018555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,balanced,0.39390401045481366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.04327679872512817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.08279039859771728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,balanced,1.5034666061401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,2,power_law_1.2,1.3899007797241212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,balanced,0.06855466465155284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.08617600202560424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.039078399538993835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,balanced,0.5626346667607626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,2,power_law_1.2,2.240889549255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,balanced,0.07195733487606049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.08664960265159607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.041228801012039185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,balanced,0.07550399998823802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,balanced,1.886090596516927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.08657919764518737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,2,power_law_1.2,2.876838493347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,balanced,0.6789653301239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.058508801460266116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.08970879912376403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,balanced,0.0790880024433136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.059564799070358276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,2,power_law_1.2,3.3533119201660155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.09340800046920776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,balanced,1.0000373522440593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.06111999750137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.10100480318069457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,2,power_law_1.2,5.051526260375977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.061286401748657224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.10075520277023316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,balanced,0.09446932872136433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,balanced,2.9313173294067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,2,power_law_1.2,10.478125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.10945279598236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.06275200247764587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,balanced,0.09864532947540283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,balanced,1.3099093437194824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.11518080234527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.06368640065193176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,balanced,0.10784000158309937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.12462719678878784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,balanced,0.14708266655604044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.16286720037460328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.06711680293083191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,balanced,1.6311465899149578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,balanced,0.1829813321431478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.1609663963317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.07000960111618042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.19693440198898315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.07266560196876526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.2644927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.07653120160102844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,balanced,5.864341100056966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,balanced,0.2757280071576436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.35740160942077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,balanced,2.6824798583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.08776320219039917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.46115841865539553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,balanced,0.34990934530893963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,power_law_1.01,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.1020095944404602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.6531968116760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,balanced,0.5079573392868042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,power_law_1.01,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.13345919847488402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.01,0.810912036895752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,power_law_1.01,0.03738240003585815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,balanced,0.6664906740188599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.1347264051437378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.01,1.153600025177002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,power_law_1.01,0.05249919891357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.17015039920806885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,power_law_1.01,0.054502397775650024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.01,1.4992128372192384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,balanced,0.9784266948699951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.22244479656219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,power_law_1.01,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.01,1.8869375228881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,power_law_1.01,0.05899519920349121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.30283520221710203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,balanced,1.297925313313802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,power_law_1.01,0.06228479743003845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.01,2.8100864410400392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.39115519523620607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,balanced,5.019023895263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,0.5591936111450195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,power_law_1.01,0.0627776026725769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.01,5.545555114746094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,balanced,1.9455040295918782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,0.7027840137481689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,power_law_1.01,0.0676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,1.003014373779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,1.356601619720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,power_law_1.01,0.07432960271835327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,balanced,2.5775200525919595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,power_law_1.01,0.07887359857559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.01,1.6831167221069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,power_law_1.01,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,power_law_1.01,0.08831359744071961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.01,2.7234495162963865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,balanced,3.222463925679525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,power_law_1.01,0.10406399965286255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.01,5.028524780273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,power_law_1.01,0.10922880172729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,power_law_1.01,0.12092800140380859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,power_law_1.01,0.15466879606246947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.055270397663116456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.01,0.20704638957977295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,balanced,5.115605354309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.05027840137481689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.01,0.2985536098480225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.05495039820671081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.07907840013504028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.01,0.37436800003051757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.08002560138702393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.01,0.5350592136383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.08158079981803894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.08496639728546143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.01,0.6942463874816894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.08559359908103943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.01,1.008236789703369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.08668799996376038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.01,1.3210432052612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.08647040128707886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.08959360122680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.01,1.9669248580932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,balanced,10.215845108032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.09401599764823913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.09964799880981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.01,2.6120704650878905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.10074880123138427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.01,3.2464065551757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.10974719524383544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.11964160203933716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,power_law_1.01,5.167737579345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.1244223952293396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.15173120498657228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,power_law_1.01,10.281196594238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.16316800117492675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.1972480058670044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.2610687971115112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.3589184045791626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.4615744113922119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.6531072139739991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,1,power_law_1.2,0.7862143993377686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,1,power_law_1.2,1.192204761505127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,1,power_law_1.2,1.509280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,1,power_law_1.2,1.9082111358642577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,1,power_law_1.2,2.833760070800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,1,power_law_1.2,5.533529663085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.04384639859199524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.041119998693466185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.057760000228881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.05886080265045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.06087039709091187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.061894398927688596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.06231039762496948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,1,power_law_1.2,0.034041601419448855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.06413440108299255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,1,power_law_1.2,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,1,power_law_1.2,0.037215998768806456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,1,power_law_1.2,0.05292159914970398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.07159039974212647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,1,power_law_1.2,0.05348479747772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.0770367980003357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,1,power_law_1.2,0.056383997201919556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.08481280207633972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,1,power_law_1.2,0.058822399377822875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.09331200122833253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,1,power_law_1.2,0.06193280220031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.10277760028839111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.12963839769363403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,1,power_law_1.2,0.06316800117492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.1349951982498169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,1,power_law_1.2,0.06659839749336242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.16855679750442504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.21924479007720948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.30664958953857424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.3946624040603638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,1,power_law_1.2,0.07373440265655518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,0.554969596862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,1,power_law_1.2,0.07905920147895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,0.6998271942138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,1,power_law_1.2,0.08025599718093872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,0.9982720375061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,1,power_law_1.2,0.08819199800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,1.3454912185668946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,1,power_law_1.2,0.10274560451507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,1,power_law_1.2,1.6959360122680665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,1,power_law_1.2,0.11039999723434449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,1,power_law_1.2,2.7267391204833986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,1,power_law_1.2,0.12224639654159546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,1,power_law_1.2,0.1648319959640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,1,power_law_1.2,5.039180755615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.2,0.2049407958984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,balanced,0.08730133374532063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,balanced,0.05745066702365875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,balanced,0.08287466565767924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.2,0.2979520082473755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,balanced,0.084389328956604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,balanced,0.06270933151245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.2,0.37369599342346194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,balanced,0.11410666505495708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,balanced,0.05682133138179779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.2,0.5315968036651612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,balanced,0.1555359959602356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,balanced,0.07588799794514973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.2,0.6914239883422851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,balanced,0.26902933915456134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,balanced,0.10486933588981628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.2,1.000921630859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,balanced,0.2723840077718099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,balanced,0.1629759967327118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.2,1.3172224044799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,balanced,0.26800533135732013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,balanced,0.164000004529953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.2,1.9549184799194337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,balanced,0.26847465833028156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,balanced,0.16461867094039917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.2,2.582271957397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,balanced,0.2694026629130046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,balanced,0.1658506691455841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,balanced,0.27003733317057294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.2,3.2147647857666017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,balanced,0.16596800088882446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,balanced,0.2723466753959656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,balanced,0.1683786710103353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,1,power_law_1.2,5.112851333618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,balanced,0.2727253238360087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,balanced,0.16922666629155478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,balanced,0.05702400207519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,balanced,0.1717546582221985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,1,power_law_1.2,10.1368896484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,balanced,0.27450666824976605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,balanced,0.1734666625658671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,balanced,0.28041066726048786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,balanced,0.05472533404827118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,balanced,0.1803306738535563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,balanced,0.057349334160486855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,balanced,0.28091732660929364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,balanced,0.07795199751853943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,balanced,0.18220800161361694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,balanced,0.28658666213353473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,balanced,0.11204800009727478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,balanced,0.1885813275973002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,balanced,0.2998720010121663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,balanced,0.15877866744995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,balanced,0.1999733249346415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,balanced,0.16076800227165222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,balanced,0.31268266836802167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,balanced,0.21172799666722616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,balanced,0.16101866960525513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,balanced,0.32524265845616657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,balanced,0.1638879974683126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.01,0.28837759494781495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,balanced,0.2341759999593099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,balanced,0.16223466396331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,balanced,0.3492319981257121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.01,0.26360321044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,balanced,0.2595679958661397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,balanced,0.16459199786186218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.01,0.2032383918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,balanced,0.3736319939295451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,balanced,0.16618667046229044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.01,0.14839680194854737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,balanced,0.1670186718304952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,balanced,0.29762667417526245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.01,0.19557119607925416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.1752895951271057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,balanced,0.16861865917841592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,balanced,0.4100480079650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.20963199138641359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,balanced,0.17684799432754517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.15850239992141724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.24296319484710693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,balanced,0.34594134489695233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.10008319616317748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,balanced,0.17749333381652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.09596800208091735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.01,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,balanced,0.18280533949534097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.11779839992523193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,balanced,0.4790506760279338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.01,0.24119679927825927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.1223039984703064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,balanced,0.4370719989140828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.01,0.24714879989624022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.15720319747924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.1551424026489258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.256115198135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,balanced,0.19378666083017984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.16241919994354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.01,0.23249280452728271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,balanced,0.5310186545054117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.149017596244812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.01,0.2592704057693481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.1557055950164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,balanced,0.5205599864323934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.01,0.27797760963439944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.16688640117645265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.01,0.28786559104919435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.16361600160598755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.01,0.31716480255126955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.16840959787368776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,balanced,0.2071146567662557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,power_law_1.01,0.16122879981994628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.01,0.31521921157836913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.18840960264205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,balanced,0.7081493536631266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.2060863971710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.01,0.3473344087600708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,balanced,0.22820266087849936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,power_law_1.01,0.15634560585021973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.17895679473876952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.01,0.3634624004364014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,power_law_1.01,0.10764800310134888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,balanced,0.7263306776682535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.23284480571746827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,balanced,0.24491200844446817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.01,0.4447807788848877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,power_law_1.01,0.09933440089225769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.23088641166687013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.01,0.4219071865081787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,power_law_1.01,0.11611520051956177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.28646399974823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.01,0.5309120178222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,power_law_1.01,0.12172160148620606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.01,0.6415743827819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.309004807472229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,power_law_1.01,0.1449280023574829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.01,0.7936192035675049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,0.39541120529174806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,balanced,0.8828106721242269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,balanced,0.28701867659886676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,power_law_1.01,0.14502400159835815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,0.4883391857147217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.01,1.083903980255127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,power_law_1.01,0.14986239671707152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,0.6128191947937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.01,1.5536959648132325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,balanced,0.9063039620717367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,power_law_1.01,0.15752960443496705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,0.8629504203796386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,balanced,0.3243359923362732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.01,1.9446592330932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,power_law_1.01,0.17048959732055663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,1.2411456108093262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.01,2.264044761657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,power_law_1.01,0.16131839752197266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,1.4213824272155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,power_law_1.01,0.17046400308609008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.01,3.3572158813476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.01,1.7506303787231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,balanced,0.44341333707173664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,power_law_1.01,0.18216320276260375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.01,7.415193939208985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,power_law_1.01,0.20165760517120362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.01,2.684435272216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,balanced,1.088752031326294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,power_law_1.01,0.21880319118499755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,power_law_1.01,0.24578559398651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.01,5.490054321289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,balanced,0.5321280161539713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,balanced,1.120400031407674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,power_law_1.01,0.25372159481048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.01,0.25553278923034667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.01,0.32072958946228025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.01,0.3983295917510986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.01,0.47022719383239747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,balanced,0.7707733313242594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.01,0.6289152145385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,balanced,1.6152480443318684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.01,0.8798720359802246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.01,1.0705920219421388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,32,power_law_1.2,0.2901952028274536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.01,1.5869312286376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,balanced,1.7157653172810872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,32,power_law_1.2,0.26333439350128174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.01,2.227859115600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,balanced,1.0059359868367512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,32,power_law_1.2,0.11439360380172729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,power_law_1.01,2.7216255187988283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,32,power_law_1.2,0.1276800036430359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.16372480392456054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.01,4.285785675048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.20339839458465575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,32,power_law_1.2,0.22036480903625488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.01,9.387181091308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.21970560550689697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.23059840202331544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.23868160247802733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,balanced,1.2549599806467693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.2519680023193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.25484158992767336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,32,power_law_1.2,0.26131200790405273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.17475199699401855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,32,power_law_1.2,0.28212480545043944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.1563199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,32,power_law_1.2,0.3077248096466064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.09661440253257751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,32,power_law_1.2,0.3157952070236206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.08746240139007569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,32,power_law_1.2,0.3277184009552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.11108479499816895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,32,power_law_1.2,0.39258880615234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.1327679991722107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,32,power_law_1.2,0.39749119281768797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.14967039823532105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.1513983964920044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,32,power_law_1.2,0.47803521156311035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,balanced,3.233781178792318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.15125759840011596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,32,power_law_1.2,0.4752319812774658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.1493888020515442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,32,power_law_1.2,0.6167359828948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,balanced,1.9952054023742676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.1559424042701721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,32,power_law_1.2,0.7494656085968018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,32,power_law_1.2,1.0474431991577149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.15564800500869752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,32,power_law_1.2,1.3542719841003419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.160806405544281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,balanced,3.375845273335775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,32,power_law_1.2,1.9571327209472655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.18305920362472533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,32,power_law_1.2,2.798956871032715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.20134398937225342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.21967999935150145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,32,power_law_1.2,3.3042240142822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.20122239589691163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,32,power_law_1.2,4.582950210571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.250163197517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.2590208053588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,32,power_law_1.2,12.412754821777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.3279871940612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,0.34574079513549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,0.44176640510559084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,0.5426112174987793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,0.8931327819824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,0.9820799827575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,1.3992064476013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,1.7671871185302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,32,power_law_1.2,2.355743980407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,32,power_law_1.2,3.793977737426758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,32,power_law_1.2,7.696326446533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,balanced,3.996351877848307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,balanced,0.06778666873772939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,balanced,0.06464533507823944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,balanced,0.06989866495132446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,balanced,0.10364799698193868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,balanced,0.1562346617380778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,balanced,0.2730293273925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,balanced,0.2749279936154683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,32,power_law_1.2,0.16236799955368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,balanced,0.2725546757380168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,balanced,0.2733866572380066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,32,power_law_1.2,0.15598080158233643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,balanced,0.27375467618306476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,balanced,0.27270400524139404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,32,power_law_1.2,0.07415680289268493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,balanced,0.27686933676401776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,balanced,0.2764693299929301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,32,power_law_1.2,0.09377920031547546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,balanced,0.2781226634979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,32,power_law_1.2,0.11289600133895875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,balanced,0.2871573368708293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,balanced,0.2879199981689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,32,power_law_1.2,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,balanced,0.2938133279482524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,32,power_law_1.2,0.1348863959312439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,balanced,0.3076000014940898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,32,power_law_1.2,0.14416639804840087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,balanced,0.3264106710751851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,32,power_law_1.2,0.1518847942352295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,balanced,0.34268800417582196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,32,power_law_1.2,0.14743679761886597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,32,power_law_1.2,0.16454399824142457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,balanced,0.3682719866434733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,32,power_law_1.2,0.1756608009338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,32,power_law_1.2,0.1748095989227295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,balanced,0.3948800166447957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,32,power_law_1.2,0.18447999954223632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,32,power_law_1.2,0.20631039142608643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,balanced,0.4373866717020671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,balanced,0.05007466673851013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,32,power_law_1.2,0.22465920448303223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,balanced,0.050928001602490745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,32,power_law_1.2,0.268883204460144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,balanced,0.0561706672112147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,balanced,0.5167200167973837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,balanced,0.0768746683994929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,balanced,0.10662399729092915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,balanced,0.16209066907564798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,32,power_law_1.2,0.29548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,balanced,0.16527466972668967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,balanced,0.1651946703592936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,balanced,0.16723199685414633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,balanced,0.5852373441060384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,balanced,0.16683199008305868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.2,0.27974400520324705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,balanced,0.1697653333346049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.2,0.3539007902145386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,balanced,0.17072000106175741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,balanced,0.17363200585047403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.2,0.4379712104797363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,balanced,0.17553067207336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,balanced,0.18263999621073404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.2,0.6074687957763671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,balanced,0.18481600284576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,balanced,0.7904213269551595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,balanced,0.19074666500091553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.2,0.6743231773376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.2,1.100921630859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,balanced,0.2050079902013143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,balanced,0.21714667479197183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.2,1.3604543685913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,balanced,0.24404799938201904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.2,2.515974426269531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,balanced,0.2714400092760722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.2,2.941548728942871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,balanced,0.9811360041300455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,balanced,0.317466676235199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,32,power_law_1.2,3.8006145477294924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.2,6.797254180908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,balanced,0.37649067242940265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,balanced,0.047370667258898415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.2,14.560000610351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,balanced,0.047637333472569786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,balanced,0.05795733133951823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,balanced,0.4697653452555339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.01,0.16980479955673217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,balanced,0.07901333272457123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,balanced,0.11372266213099162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.01,0.26904959678649903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,balanced,1.201317310333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,balanced,0.15959466497103372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.01,0.13425920009613038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,balanced,0.16193067034085593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,balanced,0.5661813418070475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.01,0.11817599534988403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,balanced,0.1620319982369741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.01,0.10762879848480225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,balanced,0.16436800360679626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.01,0.13963520526885986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,balanced,0.16420800487200418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.01,0.16984319686889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.01,0.15777280330657958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,balanced,0.16646933555603027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.01,0.2222975969314575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.01,0.09164800047874451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,balanced,0.16811732451121011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.01,0.21833600997924804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,balanced,0.7832372983296713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.01,0.08797439932823181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,balanced,0.17056532700856528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.01,0.2348031997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,balanced,0.17246399323145548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.01,0.10799360275268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,balanced,0.18081599473953247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.01,0.23189120292663573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.01,0.12126719951629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,balanced,0.18253866831461588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.01,0.2295936107635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.01,0.14150400161743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,balanced,0.1890933314959208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.01,0.23508479595184326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.01,0.1444159984588623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.01,0.24384000301361083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,balanced,1.8986666997273762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.01,0.14714239835739135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.01,0.2535936117172241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,balanced,1.0039146741231282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.01,0.14919040203094483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.01,0.2707711935043335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.01,0.1444991946220398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,balanced,0.2034506599108378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.01,0.2820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.01,0.15529600381851197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.01,0.3027519941329956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.01,0.15982719659805297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.01,0.3468224048614502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,16,power_law_1.2,0.14999040365219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.01,0.16469759941101075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.01,0.3509183883666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,power_law_1.01,0.11486719846725464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.01,0.17870080471038818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,16,power_law_1.2,0.2687743902206421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.01,0.4091775894165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,power_law_1.01,0.16383999586105347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.01,0.18513280153274536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,16,power_law_1.2,0.09326720237731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.01,0.39874560832977296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,balanced,0.22259734074274698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,balanced,1.2474506696065266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,power_law_1.01,0.09578880071640014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.01,0.1890176057815552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,16,power_law_1.2,0.11708799600601197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.01,0.5409088134765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,balanced,0.24737600485483804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,power_law_1.01,0.08431360125541687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,16,power_law_1.2,0.12536319494247436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.01,0.21155200004577637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.01,0.5608511924743652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,16,power_law_1.2,0.18017280101776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,balanced,0.2712213397026062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,power_law_1.01,0.10452480316162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.01,0.23165440559387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.01,0.7472640037536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,16,power_law_1.2,0.23588480949401855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.01,0.2819648027420044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,power_law_1.01,0.11964160203933716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.01,0.8778880119323731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,balanced,0.3349706729253133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,16,power_law_1.2,0.2337536096572876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.01,0.31623680591583253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,power_law_1.01,0.14561280012130737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.01,1.4583104133605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,16,power_law_1.2,0.22734720706939698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.01,0.3774912118911743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,power_law_1.01,0.149126398563385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.01,1.7786815643310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,balanced,0.39762667814890545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,16,power_law_1.2,0.2277440071105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.01,0.48561921119689944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,power_law_1.01,0.14494080543518068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.01,2.0618431091308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,16,power_law_1.2,0.23144960403442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.01,0.6397503852844239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,power_law_1.01,0.15600639581680298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,16,power_law_1.2,0.2498687982559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.01,3.08602237701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,power_law_1.01,0.15358079671859742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.01,0.7654848098754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,balanced,0.561738650004069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,16,power_law_1.2,0.25250558853149413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,power_law_1.01,0.16584320068359376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.01,1.0529919624328614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,16,power_law_1.2,0.269651198387146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.01,6.286956787109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,power_law_1.01,0.1685312032699585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,16,power_law_1.2,0.28286080360412597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,balanced,1.9172800381978352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.01,1.5250368118286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,power_law_1.01,0.18012160062789917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,16,power_law_1.2,0.29868159294128416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,balanced,3.6835571924845376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.01,1.7476736068725587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,balanced,0.6704426606496176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,power_law_1.01,0.19448959827423096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,16,power_law_1.2,0.3253632068634033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,power_law_1.01,0.1979200005531311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.01,2.86822395324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,16,power_law_1.2,0.37360639572143556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,power_law_1.01,0.22783360481262208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,16,power_law_1.2,0.3737920045852661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.01,5.53138542175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,16,power_law_1.2,0.4273856163024902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,16,power_law_1.2,0.464844799041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,power_law_1.01,0.24770560264587402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,balanced,0.9677386283874512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,16,power_law_1.2,0.6391488075256347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,16,power_law_1.2,0.7263487815856934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,power_law_1.01,0.26711039543151854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,16,power_law_1.2,0.8739392280578613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,power_law_1.01,0.3229824066162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,16,power_law_1.2,1.249824047088623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,power_law_1.01,0.40052480697631837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,16,power_law_1.2,1.5860608100891114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,power_law_1.01,0.498367977142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,balanced,1.2703039646148682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,16,power_law_1.2,2.2242687225341795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,power_law_1.01,0.6530687808990479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,16,power_law_1.2,3.289440155029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,power_law_1.01,0.8851840019226074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,16,power_law_1.2,4.857734298706054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,power_law_1.01,1.2539648056030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,power_law_1.01,1.6944639205932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,16,power_law_1.2,9.929158020019532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,power_law_1.01,2.2143999099731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,power_law_1.01,2.7810495376586912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,balanced,1.5873600641886394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,power_law_1.01,4.1788288116455075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,power_law_1.01,9.350022125244141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,balanced,3.804080009460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,16,power_law_1.2,0.10894080400466918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,16,power_law_1.2,0.1552896022796631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,16,power_law_1.2,0.06771199703216553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,balanced,2.5023786226908364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,16,power_law_1.2,0.08883200287818908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,16,power_law_1.2,0.10586880445480347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,16,power_law_1.2,0.11612800359725953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,16,power_law_1.2,0.14281599521636962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,16,power_law_1.2,0.1436095952987671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,16,power_law_1.2,0.1323199987411499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,16,power_law_1.2,0.14942079782485962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,16,power_law_1.2,0.158406400680542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,16,power_law_1.2,0.15770879983901978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,16,power_law_1.2,0.15908479690551758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,16,power_law_1.2,0.17204480171203612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,16,power_law_1.2,0.17870719432830812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,16,power_law_1.2,0.18907519578933715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,16,power_law_1.2,0.21303679943084716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,16,power_law_1.2,0.2403712034225464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,16,power_law_1.2,0.24528639316558837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,16,power_law_1.2,0.31164159774780276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,16,power_law_1.2,0.355347204208374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,16,power_law_1.2,0.41227521896362307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,16,power_law_1.2,0.5452544212341308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,16,power_law_1.2,0.7507584095001221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,balanced,5.016266822814941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,16,power_law_1.2,0.9109696388244629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,16,power_law_1.2,1.2087679862976075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,16,power_law_1.2,1.707788848876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,16,power_law_1.2,1.8251775741577148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,16,power_law_1.2,3.299737548828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,16,power_law_1.2,7.995699310302735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,balanced,0.056549335519472756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,16,power_law_1.2,0.11421439647674561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,balanced,0.06197333335876465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,16,power_law_1.2,0.1602560043334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,balanced,0.07063999772071838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,16,power_law_1.2,0.06325119733810425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,balanced,0.10539199908574422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,16,power_law_1.2,0.08394240140914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,balanced,0.1629759967327118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,16,power_law_1.2,0.10049920082092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,balanced,0.273632009824117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,balanced,0.2771093249320984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,balanced,0.04923733572165171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,16,power_law_1.2,0.11048959493637085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,balanced,0.2758026719093323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,16,power_law_1.2,0.1423359990119934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,balanced,0.055733333031336464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,balanced,0.27447466055552167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,16,power_law_1.2,0.14851200580596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,balanced,0.2775626579920451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,balanced,0.05513066550095876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,16,power_law_1.2,0.15602560043334962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,balanced,0.07695466776688893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,balanced,0.27988266944885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,16,power_law_1.2,0.15123840570449829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,balanced,0.10657599568367004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,balanced,0.28014399607976276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,16,power_law_1.2,0.1574079990386963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,balanced,0.1639786660671234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,16,power_law_1.2,0.1649664044380188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,balanced,0.28383467594782513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,balanced,0.16613333423932394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,16,power_law_1.2,0.1682368040084839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,balanced,0.16759467124938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,balanced,0.2837120095888774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,16,power_law_1.2,0.18026880025863648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,balanced,0.16936532656351724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,balanced,0.2937493324279785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,16,power_law_1.2,0.2050368070602417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,balanced,0.16983999808629355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,16,power_law_1.2,0.21276159286499025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,balanced,0.29340799649556476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,balanced,0.17230933904647827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,16,power_law_1.2,0.2428287982940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,balanced,0.17399466037750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,balanced,0.3028533260027568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,balanced,0.1758400003115336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,balanced,0.32014934221903485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,balanced,0.17915199200312296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,16,power_law_1.2,0.2874624013900757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,balanced,0.1872319976488749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,balanced,0.3351200024286906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,balanced,0.19012266397476196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,balanced,0.3704640070597331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,balanced,0.19738666216532388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,16,power_law_1.2,0.2804863929748535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,16,power_law_1.2,0.3608896017074585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,balanced,0.21257599194844565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,balanced,0.39614399274190265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.01,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,16,power_law_1.2,0.4349376201629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.01,0.07555840015411378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,balanced,0.23563732703526816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.01,0.15363199710845948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,16,power_law_1.2,0.5644224166870118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,balanced,0.4402720133463542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.01,0.09821439981460571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,balanced,0.267850657304128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.01,0.09452800154685974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,16,power_law_1.2,0.6496767997741699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.01,0.06573439836502075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.01,0.10118399858474732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,balanced,0.295632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,16,power_law_1.2,0.9976703643798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.01,0.076665598154068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,balanced,0.04909333089987437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,balanced,0.49021867911020917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.01,0.14183679819107056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,16,power_law_1.2,1.3736767768859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.01,0.0942911982536316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,balanced,0.051872000098228455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.01,0.15363839864730836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,balanced,0.35180266698201496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,balanced,0.05839466551939646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,16,power_law_1.2,2.3359552383422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.01,0.11159039735794067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.01,0.21293439865112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,balanced,0.08239999910195668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,balanced,0.5973493258158366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.01,0.21120638847351075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.01,0.13069440126419068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,16,power_law_1.2,2.8665792465209963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,balanced,0.11571199695269267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,balanced,0.421674648920695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.01,0.21675519943237304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.01,0.14366719722747803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,balanced,0.16524266203244528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,16,power_law_1.2,3.6781822204589845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,balanced,0.16805867354075113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.01,0.22581119537353517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.01,0.14392319917678834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,balanced,0.1691840092341105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.01,0.2369663953781128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,16,power_law_1.2,6.264492797851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,balanced,0.5453706582387289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,balanced,0.17003200451533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.01,0.14709759950637818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,balanced,0.6975306669871012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.01,0.22748799324035646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,balanced,0.17163733641306558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.01,0.15336320400238038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,balanced,0.1738026738166809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.01,0.24931199550628663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,16,power_law_1.2,12.58950424194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.01,0.1549183964729309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,balanced,0.17615467309951782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.01,0.2656831979751587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.01,0.1586176037788391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,balanced,0.17915733655293783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,balanced,0.6743840376536051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.01,0.27895679473876955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,balanced,0.18214933077494302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.01,0.16615040302276612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.01,0.2721407890319824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,balanced,0.19275200366973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,balanced,0.9296000003814697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.01,0.17956479787826538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,balanced,0.19564799467722574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.01,0.2891839981079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.01,0.18419840335845947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,balanced,0.20522133509318033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.01,0.19687680006027222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.01,0.3337791919708252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.01,0.35262720584869384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.01,0.2292479991912842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,balanced,0.94706130027771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.01,0.4146687984466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.01,0.24462080001831055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.01,0.28786559104919435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.01,0.4240896224975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.01,0.3285183906555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,balanced,0.22802132368087769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.01,0.5375552177429199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.01,0.39898879528045655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,balanced,1.1761706670125325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.01,0.5740223884582519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.01,0.47608962059021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.01,0.7910528182983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.01,0.6405951976776123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.01,0.9342911720275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.01,0.8107135772705079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.01,1.3045120239257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,balanced,1.183733304341634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.01,1.1637696266174316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.01,1.7690496444702148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,balanced,0.2537333369255066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.01,1.5305536270141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.01,2.145030403137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,balanced,0.3014613389968872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.01,3.239545440673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.01,2.0258880615234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,balanced,0.34876267115275067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.01,2.8756992340087892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.01,6.487091064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,balanced,1.4743626912434895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.01,6.1042945861816404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,balanced,0.45344531536102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,power_law_1.01,0.08487679958343505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,balanced,1.4935894012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,power_law_1.01,0.10940799713134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,balanced,0.535647988319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,power_law_1.01,0.07514240145683289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,power_law_1.01,0.08238080143928528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,power_law_1.01,0.1016319990158081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,balanced,0.7695146401723226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,8,power_law_1.2,0.10622719526290894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,power_law_1.01,0.11196800470352172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,8,power_law_1.2,0.13281279802322388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,power_law_1.01,0.1413632035255432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,8,power_law_1.2,0.07029119729995728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,8,power_law_1.2,0.1066431999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,power_law_1.01,0.14568320512771607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,8,power_law_1.2,0.13556480407714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,balanced,0.9349599679311117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,power_law_1.01,0.1513216018676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,8,power_law_1.2,0.15395840406417846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,power_law_1.01,0.15030399560928345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,8,power_law_1.2,0.2141119956970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,balanced,2.2303892771402993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,8,power_law_1.2,0.2200256109237671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,power_law_1.01,0.1614400029182434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,8,power_law_1.2,0.23567359447479247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,power_law_1.01,0.16494719982147216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,8,power_law_1.2,0.22721920013427735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,balanced,2.2622507413228354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,power_law_1.01,0.1724544048309326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,8,power_law_1.2,0.2430527925491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,power_law_1.01,0.1890176057815552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,8,power_law_1.2,0.2410304069519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,balanced,1.3725600242614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,power_law_1.01,0.19785599708557128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,8,power_law_1.2,0.24476161003112792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,8,power_law_1.2,0.26513919830322263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,power_law_1.01,0.20906240940093995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,8,power_law_1.2,0.27653119564056394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,power_law_1.01,0.23760640621185303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,8,power_law_1.2,0.31050240993499756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,8,power_law_1.2,0.3146752119064331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,8,power_law_1.2,0.34863359928131105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,power_law_1.01,0.264902400970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,8,power_law_1.2,0.3860608100891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,8,power_law_1.2,0.4715519905090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,8,power_law_1.2,0.44960641860961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,power_law_1.01,0.29896318912506104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,balanced,1.8102879524230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,8,power_law_1.2,0.5776127815246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,8,power_law_1.2,0.6752575874328614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,power_law_1.01,0.3909440040588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,8,power_law_1.2,0.9287936210632324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,power_law_1.01,0.4785600185394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,8,power_law_1.2,0.9804351806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,power_law_1.01,0.615174388885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,8,power_law_1.2,1.6890432357788085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,power_law_1.01,0.709657621383667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,8,power_law_1.2,2.030988883972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,power_law_1.01,1.0185536384582519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,8,power_law_1.2,2.7749631881713865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,power_law_1.01,1.3908351898193358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,8,power_law_1.2,4.379513549804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,power_law_1.01,1.8770175933837892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,balanced,2.256394704182943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,power_law_1.2,9.334464263916015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,power_law_1.01,2.7720256805419923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,power_law_1.01,3.2940673828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,power_law_1.01,5.220044708251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,8,balanced,4.418848037719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,power_law_1.01,10.68787841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,balanced,4.476101239522298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,balanced,3.580575942993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,8,power_law_1.2,0.07564160227775574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,8,power_law_1.2,0.0972927987575531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,8,power_law_1.2,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,8,power_law_1.2,0.07678719758987426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,8,power_law_1.2,0.0869376003742218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,8,power_law_1.2,0.10658559799194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,8,power_law_1.2,0.1398144006729126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,8,power_law_1.2,0.13950719833374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,8,power_law_1.2,0.14149760007858275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,8,power_law_1.2,0.14534399509429932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,8,power_law_1.2,0.15326080322265626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,8,power_law_1.2,0.16364799737930297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,8,power_law_1.2,0.16161279678344725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,8,power_law_1.2,0.16496000289916993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,balanced,7.175488154093425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,8,power_law_1.2,0.18353279829025268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,8,power_law_1.2,0.1879744052886963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,8,power_law_1.2,0.08056960105895997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,8,power_law_1.2,0.2036288022994995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,8,power_law_1.2,0.10659199953079224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,8,power_law_1.2,0.2356031894683838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,8,power_law_1.2,0.24778881072998046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,8,power_law_1.2,0.061388802528381345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,balanced,0.05730666716893514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,8,power_law_1.2,0.29129600524902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,8,power_law_1.2,0.07808640003204345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,balanced,0.06136000156402588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,8,power_law_1.2,0.09253119826316833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,8,power_law_1.2,0.35216000080108645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,balanced,0.07227199772993724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,8,power_law_1.2,0.4497856140136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,8,power_law_1.2,0.10212479829788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,balanced,0.10460799932479858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,8,power_law_1.2,0.13948800563812255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,8,power_law_1.2,0.5398911952972412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,balanced,0.16386666893959045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,balanced,0.2765386700630188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,8,power_law_1.2,0.14451199769973755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,8,power_law_1.2,0.709606409072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,balanced,0.2778079907099406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,8,power_law_1.2,0.14743679761886597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,8,power_law_1.2,0.9039104461669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,balanced,0.2771679957707723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,8,power_law_1.2,0.1555840015411377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,8,power_law_1.2,1.267692756652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,balanced,0.27801599105199176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,8,power_law_1.2,0.1553536057472229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,balanced,0.27979199091593426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,8,power_law_1.2,1.8380928039550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,8,power_law_1.2,0.16902400255203248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,balanced,0.2820799946784973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,8,power_law_1.2,0.17161600589752196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,8,power_law_1.2,2.196569633483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,balanced,0.2847893238067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,8,power_law_1.2,0.18528000116348267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,8,power_law_1.2,3.5868862152099608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,balanced,0.2860320011774699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,8,power_law_1.2,0.20851199626922606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,balanced,0.2900213400522868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,8,power_law_1.2,0.2235327959060669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,8,power_law_1.2,7.378713226318359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,balanced,0.29764266808827716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,8,power_law_1.2,0.24097919464111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,balanced,0.3020426630973816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,balanced,0.3113226691881816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,8,power_law_1.2,0.28336639404296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,balanced,0.33315199613571167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,balanced,0.36505599816640216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,8,power_law_1.2,0.29405438899993896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,balanced,0.40808534622192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,8,power_law_1.2,0.3914367914199829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,8,power_law_1.2,0.483948802947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,balanced,0.4431999921798706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,8,power_law_1.2,0.6285568237304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,balanced,0.5278879801432291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,8,power_law_1.2,0.8215359687805176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,balanced,0.04955733319123586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,balanced,0.05178666611512502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,8,power_law_1.2,1.2099136352539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,balanced,0.05724266668160757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,balanced,0.6104586521784464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,8,power_law_1.2,1.588697624206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,balanced,0.07905599971612294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,balanced,0.11059733231862386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,8,power_law_1.2,2.4602048873901365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,balanced,0.1710666616757711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,balanced,0.1735466718673706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,8,power_law_1.2,3.6296833038330076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,balanced,0.17526400089263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,balanced,0.7826933066050211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,balanced,0.1769333283106486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,8,power_law_1.2,3.9178367614746095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,balanced,0.17971199750900269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,balanced,0.18204800287882486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,8,power_law_1.2,6.095782470703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,balanced,0.18826667467753092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,balanced,0.18869866927464804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,balanced,0.9705333709716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.01,0.05727999806404114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,balanced,0.1965386668841044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.01,0.073990398645401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,8,power_law_1.2,16.12665557861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.01,0.07319679856300354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,balanced,0.2058453361193339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.01,0.10038399696350098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.01,0.059539198875427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,balanced,0.20797866582870483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.01,0.07939839959144593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.01,0.07427200078964233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,balanced,0.2188053329785665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.01,0.09685760140419006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,balanced,0.059088001648585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.01,0.09314560294151306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.01,0.1295232057571411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,balanced,0.06281066437562306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,balanced,0.2405173381169637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,balanced,1.3398240407307942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.01,0.11887359619140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.01,0.1537727952003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,balanced,0.07008000214894612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,balanced,0.2717333237330119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.01,0.1380288004875183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.01,0.19922560453414917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,balanced,0.09128533800443013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.01,0.14513280391693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.01,0.2086400032043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,balanced,0.11981333295504253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,balanced,0.319269339243571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.01,0.14565119743347169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.01,0.22031359672546386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,balanced,0.1861226757367452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.01,0.15123200416564941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,balanced,0.18730133771896362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.01,0.2244863986968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,balanced,0.3453173240025838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,balanced,0.19010132551193237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.01,0.16187520027160646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.01,0.24356479644775392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,balanced,0.19164266188939413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.01,0.25153920650482176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.01,0.16600320339202881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,balanced,0.4336320161819458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,balanced,0.19477866093317667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,balanced,1.6327892939249675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.01,0.25452799797058107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.01,0.17251839637756347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,balanced,0.19849600394566855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.01,0.2752511978149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.01,0.1833407998085022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,balanced,0.20253332455952963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,balanced,0.5332693258921305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,balanced,0.20638932784398398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.01,0.2788671970367432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.01,0.1996224045753479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,balanced,0.21402132511138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.01,0.30570240020751954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.01,0.2073728084564209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,balanced,0.22759467363357544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.01,0.30935680866241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.01,0.218176007270813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,balanced,0.23478933175404867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.01,0.35910398960113527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.01,0.24607999324798585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,balanced,0.7187253634134928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,balanced,0.24725866317749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.01,0.3854527950286865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.01,0.2799423933029175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.01,0.43301119804382326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.01,0.34073600769042967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,balanced,2.081493377685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.01,0.399833607673645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.01,0.4659520149230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,balanced,0.9175786972045898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.01,0.4771584033966064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,balanced,0.2874666651089986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.01,0.5942656040191651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.01,0.5723648071289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.01,0.6751296043395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.01,0.948089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.01,0.8212608337402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.01,1.067840003967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.01,0.9982144355773925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.01,1.6201791763305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.01,1.4297599792480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,balanced,0.3575199842453003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,balanced,1.3352160453796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.01,1.864384078979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.01,1.9019392013549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,balanced,0.4427200158437093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.01,2.4433664321899413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.01,2.517523193359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,balanced,0.5013759930928549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.01,3.809574508666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.01,3.7712257385253904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,balanced,0.6893706321716309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.01,7.335673522949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.01,7.649644470214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,balanced,3.0408852895100913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,power_law_1.01,0.07622399926185608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,balanced,0.8225279649098715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,balanced,1.6097973187764485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,power_law_1.01,0.08899199962615967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,power_law_1.01,0.08047360181808472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,power_law_1.01,0.0832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,balanced,1.2548853556315105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,power_law_1.01,0.10559999942779541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,power_law_1.01,0.12396160364151002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,power_law_1.01,0.15111680030822755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,power_law_1.01,0.15864959955215455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,power_law_1.01,0.16940799951553345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,balanced,1.5468319257100422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,power_law_1.01,0.16230399608612062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,balanced,2.0430506070454917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,power_law_1.01,0.18421759605407714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,power_law_1.01,0.18843519687652588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,power_law_1.01,0.1932927966117859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,power_law_1.01,0.21906559467315673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,balanced,2.2604907353719077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,power_law_1.01,0.2346496105194092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,power_law_1.01,0.2641216039657593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,power_law_1.01,0.2904191970825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,4,power_law_1.2,0.07400320172309875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,power_law_1.01,0.356825590133667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,4,power_law_1.2,0.1013375997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,balanced,2.961711883544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,4,power_law_1.2,0.06555520296096802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,power_law_1.01,0.40303359031677244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,4,power_law_1.2,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,power_law_1.01,0.5116928100585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,balanced,3.1063785552978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,4,power_law_1.2,0.11977599859237671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,power_law_1.01,0.5936575889587402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,4,power_law_1.2,0.1531008005142212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,4,power_law_1.2,0.196070396900177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,power_law_1.01,0.7868800163269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,balanced,5.944501241048177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,4,power_law_1.2,0.20768001079559326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,power_law_1.01,1.0507264137268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,4,power_law_1.2,0.22286078929901124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,power_law_1.01,1.4425087928771974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,4,power_law_1.2,0.22593278884887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,4,power_law_1.2,0.2442239999771118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,power_law_1.01,1.9490432739257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,balanced,3.6905225118001304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,4,power_law_1.2,0.2547647953033447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,power_law_1.01,2.9267520904541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,4,power_law_1.2,0.2587584018707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,power_law_1.01,3.8009857177734374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,4,power_law_1.2,0.270086407661438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,power_law_1.01,4.917772674560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,4,power_law_1.2,0.30392320156097413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,4,power_law_1.2,0.3201855897903442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,power_law_1.01,6.791923522949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,4,power_law_1.2,0.34987521171569824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,4,power_law_1.2,0.37550721168518064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,power_law_1.01,14.808210754394532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,4,power_law_1.2,0.3884671926498413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,4,power_law_1.2,0.05754240155220032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,4,power_law_1.2,0.45550079345703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,4,power_law_1.2,0.49541759490966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,4,power_law_1.2,0.07177600264549255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,4,power_law_1.2,0.05600000023841858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,4,power_law_1.2,0.6141119956970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,balanced,5.805941263834636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,4,power_law_1.2,0.06954240202903747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,4,power_law_1.2,0.7481728076934815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,4,power_law_1.2,0.08694400191307068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,4,power_law_1.2,0.9414336204528808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,4,power_law_1.2,0.10294400453567505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,4,power_law_1.2,1.202387237548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,4,power_law_1.2,0.13343360424041747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,4,power_law_1.2,1.6900032043457032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,4,power_law_1.2,0.1399616003036499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,balanced,6.096719741821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,4,power_law_1.2,2.380614471435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,4,power_law_1.2,0.14499839544296264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,4,power_law_1.2,3.082131195068359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,4,power_law_1.2,0.1509951949119568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,4,power_law_1.2,0.16317440271377565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,4,power_law_1.2,5.054899215698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,4,power_law_1.2,0.16129280328750611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,4,power_law_1.2,0.17390079498291017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,4,power_law_1.2,8.140447998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,4,power_law_1.2,0.18592640161514282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,4,power_law_1.2,0.1992576003074646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,4,power_law_1.2,0.21250560283660888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,4,power_law_1.2,0.22014079093933106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,4,power_law_1.2,0.2593280076980591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,4,power_law_1.2,0.2815680027008057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,4,power_law_1.2,0.36078081130981443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,4,power_law_1.2,0.40071678161621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,4,power_law_1.2,0.5057216167449952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,4,power_law_1.2,0.6279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,4,power_law_1.2,0.863212776184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,4,power_law_1.2,1.1201151847839355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,4,power_law_1.2,1.6560960769653321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,balanced,11.5982297261556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,4,power_law_1.2,1.9577728271484376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,balanced,0.058650667468706764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,4,power_law_1.2,2.5059072494506838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,balanced,0.06397866706053416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,balanced,0.07459733386834462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,4,power_law_1.2,4.003731155395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,balanced,0.10846400260925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,4,power_law_1.2,0.0739135980606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,balanced,0.17332265774408975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,4,power_law_1.2,8.26537628173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,4,power_law_1.2,0.08657280206680298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,balanced,0.29413866996765137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,4,power_law_1.2,0.06910719871520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,balanced,0.29684267441431683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,4,power_law_1.2,0.08401280045509338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,4,power_law_1.2,0.10309120416641235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,balanced,0.2955519954363505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,4,power_law_1.2,0.11633919477462769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,balanced,0.2990666627883911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,4,power_law_1.2,0.15054080486297608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,4,power_law_1.2,0.16535040140151977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,balanced,0.30341867605845135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,4,power_law_1.2,0.15930240154266356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,balanced,0.3109760085741679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,4,power_law_1.2,0.1675968050956726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,balanced,0.316106657187144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,4,power_law_1.2,0.18186240196228026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,4,power_law_1.2,0.1949504017829895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,balanced,0.3192373315493266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,4,power_law_1.2,0.20678400993347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,4,power_law_1.2,0.21952641010284424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,balanced,0.3107200066248576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,4,power_law_1.2,0.2364351987838745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,balanced,0.3217173417409261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,4,power_law_1.2,0.25804159641265867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,balanced,0.3254133264223735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,4,power_law_1.2,0.29935359954833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,balanced,0.3373440106709798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,4,power_law_1.2,0.36241281032562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,balanced,0.37703998883565265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,balanced,0.42466668287913006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,4,power_law_1.2,0.40802559852600095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,balanced,0.49252267678578693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,4,power_law_1.2,0.5352575778961182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,4,power_law_1.2,0.627948808670044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,balanced,0.5482079982757568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,4,power_law_1.2,0.8724479675292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,4,power_law_1.2,1.1118207931518556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,balanced,0.7074613571166992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,4,power_law_1.2,1.547424030303955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,balanced,0.05217599868774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,4,power_law_1.2,2.240928077697754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,balanced,0.871946652730306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,balanced,0.05462400118509928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,4,power_law_1.2,2.990329551696777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,balanced,0.06388266881306966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,balanced,0.0878613293170929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,4,power_law_1.2,4.063577651977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,balanced,0.12924800316492716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,balanced,0.20237332582473755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,balanced,1.20960529645284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,4,power_law_1.2,4.886662292480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,balanced,0.20356265703837076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,balanced,0.204367995262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,4,power_law_1.2,7.8245697021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,balanced,0.2079040010770162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,balanced,0.20893865823745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,balanced,1.5361653963724773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,balanced,0.2117919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,4,power_law_1.2,17.904051208496092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,balanced,0.21629865964253744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,balanced,0.22105600436528525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,balanced,0.22573866446812949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,balanced,0.23662932713826498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,balanced,0.24194133281707764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,balanced,2.197813351949056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,balanced,0.26077866554260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,balanced,0.2982293367385864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,balanced,0.3380533456802368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,balanced,0.3922559817632039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,balanced,0.4490826527277629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,balanced,2.6269920667012534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,balanced,0.6064373254776001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.01,0.06102399826049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,balanced,0.08027199904123943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.01,0.07265920042991639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,balanced,0.7647573153177897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,balanced,0.08560533324877422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.01,0.06929280161857605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,balanced,0.09293333689371745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.01,0.09086719751358033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,balanced,0.11703466375668843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,balanced,0.16110933820406595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.01,0.13085440397262574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,balanced,1.085263967514038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,balanced,0.23057599862416586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.01,0.15663360357284545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,balanced,0.2369920015335083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,balanced,3.32207457224528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,balanced,0.24109333753585815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.01,0.21955840587615966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.01,0.05370240211486817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,balanced,0.2452053427696228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.01,0.22692480087280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.01,0.061312001943588254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,balanced,1.4156640370686848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,balanced,0.24837867418924967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.01,0.2353663921356201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,balanced,0.2567360003789266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.01,0.0564736008644104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.01,0.24046719074249268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,balanced,0.26626133918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.01,0.0780672013759613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.01,0.2532351970672607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,balanced,0.274122675259908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.01,0.09905279874801635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.01,0.2660736083984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.01,0.12325760126113891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,balanced,0.28517866134643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.01,0.28047358989715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,balanced,2.055456002553304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.01,0.15549440383911134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,balanced,0.305786669254303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.01,0.28409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,balanced,0.32012800375620526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.01,0.16558079719543456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.01,0.3047231912612915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,balanced,0.3514933188756307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.01,0.17100160121917723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.01,0.174508798122406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.01,0.33196799755096434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.01,0.18562560081481932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.01,0.3353919982910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.01,0.19475200176239013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,balanced,4.996954600016276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.01,0.41736321449279784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,balanced,0.43824533621470135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.01,0.20421760082244872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,balanced,2.458090623219808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.01,0.45984640121459963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.01,0.22495360374450685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.01,0.5390399932861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.01,0.24102399349212647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.01,0.6150527954101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.01,0.25109119415283204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,power_law_1.01,0.08195199966430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.01,0.7400959968566895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.01,0.2668864011764526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,balanced,0.5506293376286825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.01,0.9320511817932129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,power_law_1.01,0.09182080030441284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.01,0.3076672077178955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,2,power_law_1.2,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,power_law_1.01,0.09475839734077454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.01,0.3420543909072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.01,1.245952033996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,balanced,0.7038293679555258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,power_law_1.01,0.11042560338973999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,2,power_law_1.2,0.07271040081977845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.01,0.4056511878967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.01,1.5314111709594727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,power_law_1.01,0.13233280181884766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,balanced,3.1605920791625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,balanced,0.8000533580780029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,2,power_law_1.2,0.06529920101165772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.01,0.4875391960144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.01,2.2855808258056642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,power_law_1.01,0.15205119848251342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,2,power_law_1.2,0.08635519742965699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.01,0.6179903984069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,power_law_1.01,0.19341440200805665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.01,2.8291711807250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,2,power_law_1.2,0.11995520591735839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,balanced,1.1588106950124104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,power_law_1.01,0.2061824083328247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.01,0.7840191841125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,power_law_1.01,0.21171200275421143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.01,3.5157119750976564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,2,power_law_1.2,0.1431040048599243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.01,1.0812224388122558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,power_law_1.01,0.2180351972579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,2,power_law_1.2,0.20736000537872315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,balanced,1.3951999346415203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,power_law_1.01,0.24135680198669435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.01,1.428275203704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.01,5.9485633850097654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,2,power_law_1.2,0.22236158847808837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,power_law_1.01,0.2522111892700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.01,2.0652544021606447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,2,power_law_1.2,0.23057279586791993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,power_law_1.01,0.26358399391174314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.01,12.038227081298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,power_law_1.01,0.2949183940887451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,2,power_law_1.2,0.23914239406585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.01,2.666387176513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,balanced,2.1450506846110025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,power_law_1.01,0.3099967956542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,2,power_law_1.2,0.25924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,power_law_1.01,0.34922239780426023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.01,3.153318405151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,2,power_law_1.2,0.2651648044586182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,power_law_1.01,0.4096640110015869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,2,power_law_1.2,0.28465919494628905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.01,5.294086456298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,2,power_law_1.2,0.294649600982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,2,power_law_1.2,0.3338112115859985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,balanced,2.666378657023112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,balanced,4.793343861897786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,power_law_1.01,0.5044608116149902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.01,10.489568328857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,2,power_law_1.2,0.3541696071624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,2,power_law_1.2,0.35050239562988283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,power_law_1.01,0.5759103775024415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,2,power_law_1.2,0.431660795211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,balanced,9.714330673217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,power_law_1.01,0.7815743923187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,2,power_law_1.2,0.4731071949005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,power_law_1.01,0.9234880447387696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,2,power_law_1.2,0.545689582824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,balanced,3.9483893712361655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,power_law_1.01,1.2589823722839355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,2,power_law_1.2,0.6185855865478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,power_law_1.01,1.609542465209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,2,power_law_1.2,0.7958591938018799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,power_law_1.01,2.269055938720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,2,power_law_1.2,0.9430080413818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,power_law_1.01,3.0611904144287108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,2,power_law_1.2,1.387833595275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,power_law_1.01,4.598502349853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,2,power_law_1.2,1.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,power_law_1.01,5.815731048583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,balanced,5.226906776428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,2,power_law_1.2,2.342905616760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,power_law_1.01,6.9338432312011715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,2,power_law_1.2,0.053465598821640016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,2,power_law_1.2,2.859507179260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,power_law_1.01,12.155974578857421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,2,power_law_1.2,0.06120319962501526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,2,power_law_1.2,3.7858303070068358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,2,power_law_1.2,0.058195197582244874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,2,power_law_1.2,0.07389439940452576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,2,power_law_1.2,5.662572860717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,power_law_1.01,23.043589782714843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,2,power_law_1.2,0.09459199905395507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,2,power_law_1.2,0.11519360542297363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,2,power_law_1.2,12.973049926757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,2,power_law_1.2,0.1555392026901245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,balanced,6.535615921020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,2,power_law_1.2,0.16310399770736694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,2,power_law_1.2,0.16972800493240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,balanced,9.428890864054361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,2,power_law_1.2,0.17416319847106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,2,power_law_1.2,0.18731520175933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,2,power_law_1.2,0.1972607970237732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,2,power_law_1.2,0.20592000484466552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,2,power_law_1.2,0.23292160034179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,2,power_law_1.2,0.24396800994873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,2,power_law_1.2,0.25632638931274415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,2,power_law_1.2,0.27005441188812257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,2,power_law_1.2,0.3208319902420044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,balanced,10.32368532816569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,2,power_law_1.2,0.3579904079437256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,2,power_law_1.2,0.41547517776489257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,2,power_law_1.2,0.5068223953247071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,2,power_law_1.2,0.6454016208648682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,2,power_law_1.2,0.79584641456604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,2,power_law_1.2,1.1276543617248536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,2,power_law_1.2,1.4338239669799804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,2,power_law_1.2,2.129759979248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,2,power_law_1.2,2.746348762512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,2,power_law_1.2,3.5179519653320312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,2,power_law_1.2,5.503379058837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,2,power_law_1.2,11.4498046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,balanced,20.439008076985676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,balanced,0.06366399923960368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,2,power_law_1.2,0.08178560137748718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,balanced,0.08255999783674876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,2,power_law_1.2,0.09222400188446045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,balanced,0.0940053363641103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,balanced,0.05884799857934316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,balanced,0.13111467162768045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,2,power_law_1.2,0.08945279717445373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,balanced,0.20151466131210327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,2,power_law_1.2,0.10762879848480225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,balanced,0.33419732252756756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,balanced,0.06351466476917267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,2,power_law_1.2,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,balanced,0.3386933406194051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,balanced,0.34061332543691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,balanced,0.07602666815121968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,2,power_law_1.2,0.14620800018310548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,balanced,0.3442293405532837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,2,power_law_1.2,0.19041919708251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,balanced,0.34720532099405926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,balanced,0.1132319966952006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,2,power_law_1.2,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,balanced,0.35096001625061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,balanced,0.17012266318003336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,balanced,0.3601333300272624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,2,power_law_1.2,0.20647680759429932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,balanced,0.3652799924214681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,balanced,0.2842666705449422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,2,power_law_1.2,0.2151871919631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,balanced,0.3744106690088908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,balanced,0.28827200333277386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,2,power_law_1.2,0.23768320083618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,balanced,0.38701868057250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,balanced,0.2893706758817037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,balanced,0.39427733421325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,2,power_law_1.2,0.24920320510864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,balanced,0.2950399915377299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,balanced,0.4158560037612915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,2,power_law_1.2,0.2687040090560913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,balanced,0.48017601172129315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,2,power_law_1.2,0.2977407932281494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,balanced,0.29546133677164715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,2,power_law_1.2,0.3270591974258423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,balanced,0.5541013479232788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,2,power_law_1.2,0.3481856107711792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,balanced,0.2965493400891622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,balanced,0.6655360062917074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,2,power_law_1.2,0.4134079933166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.059494400024414064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,balanced,0.3062293330828349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,balanced,0.7727999687194824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.08112000226974488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,balanced,0.3124319911003113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.07678080201148987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,2,power_law_1.2,0.5270400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,balanced,1.069050629933675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.11291520595550537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,balanced,0.3195893367131551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.15207040309906006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,2,power_law_1.2,0.5857279777526856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,balanced,1.3944320678710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,balanced,0.33089067538579303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.1905087947845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.05370240211486817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,2,power_law_1.2,0.7751232147216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.24697599411010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,balanced,0.33661333719889325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.06593279838562012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,2,power_law_1.2,0.9499903678894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.264736008644104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,balanced,0.36618133385976154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.06751999855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,balanced,2.0221120516459146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,2,power_law_1.2,1.3117055892944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.2742784023284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,balanced,0.4302346706390381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.09623039960861206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,2,power_law_1.2,1.6545856475830079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.275545597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.1243008017539978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,balanced,0.4991519848505656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,2,power_law_1.2,2.428620719909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.30426878929138185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.15607680082321168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,2,power_law_1.2,2.973222351074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,balanced,0.5771306753158569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.3104127883911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,balanced,2.519968032836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.21101438999176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.3223615884780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,2,power_law_1.2,4.898220825195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.22699520587921143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,balanced,0.666266679763794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.23030400276184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.3406208038330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,2,power_law_1.2,5.966393661499024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.2400576114654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.3578304052352905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,balanced,0.9649600187937418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,2,power_law_1.2,7.1708732604980465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.2535232067108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.38153600692749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.2739264011383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.41361279487609864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,balanced,3.7114292780558267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,2,power_law_1.2,12.074361419677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.2880064010620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.5267199993133544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,balanced,1.2465973695119221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.3109888076782227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.5955904006958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.34149119853973386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.7804224014282226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,2,power_law_1.2,23.145126342773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.369215989112854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,balanced,1.8264959653218586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.8487423896789551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.3823807954788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.01,1.0807807922363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.4620543956756592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.01,1.3102399826049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,0.5027584075927735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,balanced,4.421525319417317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,0.6132800102233886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.01,1.8574848175048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,balanced,2.3738452593485513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,0.7230144023895264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.01,2.370636749267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,0.9372159957885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.01,3.456620788574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,1.1979071617126464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.01,4.396851348876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,1.6653568267822265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.01,5.49552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,balanced,3.550506591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,2.2180736541748045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.01,8.329759979248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,3.269728088378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,balanced,5.688714981079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,4.178291320800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.01,16.256646728515626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.01,5.334444808959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.01,8.684255981445313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,balanced,4.246426582336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.01,15.486834716796874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.07896320223808288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.10853760242462158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.1385599970817566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.17460479736328124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.24325759410858155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.2553663969039917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.2666111946105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,balanced,8.283333460489908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,balanced,5.518063863118489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.2967679977416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.31269121170043945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.32928640842437745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.34202880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.3593983888626099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.4105855941772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.43442559242248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.5440832138061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.6471936225891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.7788864135742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.861292839050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,1,power_law_1.2,1.0911935806274413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,balanced,8.31273078918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,1,power_law_1.2,1.376467227935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.9210624694824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,1,power_law_1.2,2.39816951751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,1,power_law_1.2,3.5260414123535155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,1,power_law_1.2,4.560428619384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,1,power_law_1.2,5.800844955444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,1,power_law_1.2,8.283999633789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,power_law_1.2,16.090541076660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,1,balanced,16.6211675008138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,balanced,15.859125773111979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.05384320020675659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.06633599996566772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.06863999962806702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.09333119988441467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.11758719682693482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.1435968041419983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.20787200927734376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.21678719520568848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.22803199291229248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.24033920764923095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.25515520572662354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.2744064092636108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.287007999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,balanced,0.025013332565625507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.3216063976287842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,balanced,0.024559999505678814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.34990720748901366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,balanced,0.024522667129834492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.3773567914962769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,balanced,0.027562665442625683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,balanced,0.03175999969244003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.3931071996688843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.4622015953063965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,balanced,0.030965333183606465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,balanced,0.031114667654037476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,0.5235007762908935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,balanced,0.03136533250411352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,balanced,0.030421334008375805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,balanced,0.0331839993596077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,0.6347263813018799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,balanced,0.0305226668715477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,balanced,0.03461333364248276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,0.7416639804840088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,balanced,0.03290133426586787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,balanced,0.03421333432197571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,balanced,0.03473600000143051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,0.9716544151306152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,balanced,0.033376000821590424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,balanced,0.03640533238649368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,balanced,0.03558400024970373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,1.2180416107177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,balanced,0.03654933224121729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,1.7344255447387695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,balanced,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,balanced,0.043354665239652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,balanced,0.036602665980656944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,2.2563520431518556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,balanced,0.04517866671085358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,balanced,0.03658666710058848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,3.3484352111816404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,balanced,0.03702399879693985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,balanced,0.04470400015513102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,balanced,0.037733333806196846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,4.3197887420654295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,balanced,0.04901866614818573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,1,power_law_1.2,5.533407974243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,balanced,0.03882666677236557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,balanced,0.051216001311937966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,balanced,0.04127466678619385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,balanced,0.052890668312708534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,1,power_law_1.2,8.84853744506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,balanced,0.041349334021409355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,balanced,0.0555626650651296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,balanced,0.04159466673930486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,balanced,0.04545066754023234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,1,power_law_1.2,15.616294860839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,balanced,0.057349334160486855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,balanced,0.04478933413823446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,balanced,0.02378133436044057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,balanced,0.023786666492621105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,balanced,0.05818133552869161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,balanced,0.06623999774456024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,balanced,0.023914667467276256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,balanced,0.02643733223279317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,balanced,0.06180266539255778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,balanced,0.028149334092934925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,balanced,0.0710453341404597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,balanced,0.029818666477998097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,balanced,0.0746506651242574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,balanced,0.03011200080315272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,balanced,0.02975466599067052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,balanced,0.08906132976214091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,balanced,0.08588266372680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,balanced,0.029872000217437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,balanced,0.030410667260487873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,balanced,0.030581332743167877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,balanced,0.03048533449570338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,balanced,0.1095413366953532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,balanced,0.031632001201311745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,balanced,0.09704533219337463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,balanced,0.032032000521818794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,balanced,0.03468266626199087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,balanced,0.034458667039871216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,balanced,0.1260586678981781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,power_law_1.01,0.03110400140285492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,balanced,0.1388746698697408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,power_law_1.01,0.03688960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,balanced,0.035173334181308746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,power_law_1.01,0.02871679961681366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,power_law_1.01,0.027136000990867614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,power_law_1.01,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,balanced,0.03989866624275843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,power_law_1.01,0.030713599920272828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,balanced,0.1777226726214091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,power_law_1.01,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,power_law_1.01,0.032390400767326355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,balanced,0.03844800094763438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,power_law_1.01,0.0328000009059906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,power_law_1.01,0.03248000144958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,power_law_1.01,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,power_law_1.01,0.03729279935359955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,power_law_1.01,0.033606401085853575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,power_law_1.01,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,power_law_1.01,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,power_law_1.01,0.0385343998670578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,balanced,0.1611199975013733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,power_law_1.01,0.03940480053424835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,power_law_1.01,0.03535360097885132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,balanced,0.048783997694651283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,power_law_1.01,0.04108799993991852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,power_law_1.01,0.036339199542999266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,power_law_1.01,0.04656639993190766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,power_law_1.01,0.05053439736366272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,balanced,0.05147199829419454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,power_law_1.01,0.036185601353645326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,balanced,0.21494932969411215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,power_law_1.01,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,power_law_1.01,0.036959999799728395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,power_law_1.01,0.05418879985809326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,power_law_1.01,0.0385919988155365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,power_law_1.01,0.07051519751548767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,power_law_1.01,0.04008319973945618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,power_law_1.01,0.08787199854850769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,power_law_1.01,0.04079999923706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,power_law_1.01,0.08156800270080566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,balanced,0.06740800042947133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,power_law_1.01,0.04625920057296753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,power_law_1.01,0.10341119766235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,power_law_1.01,0.04859519898891449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,balanced,0.18424000342686972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,power_law_1.01,0.12659840583801268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,power_law_1.01,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,power_law_1.01,0.024505600333213806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,balanced,0.07566933333873749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,power_law_1.01,0.18954240083694457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,power_law_1.01,0.06500480175018311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,power_law_1.01,0.024198399484157564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,power_law_1.01,0.06531839966773986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,power_law_1.01,0.20806400775909423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,balanced,0.2552000085512797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,power_law_1.01,0.026444798707962035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,power_law_1.01,0.07936000227928161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,power_law_1.01,0.3182719945907593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,power_law_1.01,0.08917760252952575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,power_law_1.01,0.026668798923492432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,power_law_1.01,0.4384960174560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,power_law_1.01,0.11609599590301514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,power_law_1.01,0.12147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,power_law_1.01,0.028089600801467895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,power_law_1.01,0.5033279895782471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,power_law_1.01,0.1829375982284546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,power_law_1.01,0.02839039862155914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,power_law_1.01,0.7620800018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,power_law_1.01,0.22708480358123778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,power_law_1.01,0.33752319812774656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,balanced,0.09773332873980205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,power_law_1.01,1.6885696411132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,power_law_1.01,0.40828800201416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,power_law_1.01,0.0313728004693985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,power_law_1.01,0.5031807899475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,power_law_1.01,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,power_law_1.01,0.8048128128051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,power_law_1.01,0.03408640027046204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,32,power_law_1.2,0.030636799335479737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,power_law_1.01,0.038201600313186646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,power_law_1.01,1.5723711967468261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,balanced,0.11823466420173645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,balanced,0.26786667108535767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,power_law_1.01,0.04336000084877014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,32,power_law_1.2,0.027001601457595826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,power_law_1.01,0.045388799905776975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,32,power_law_1.2,0.027884799242019653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,balanced,0.3866560061772664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,power_law_1.01,0.04644480049610138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,32,power_law_1.2,0.028300800919532777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,power_law_1.01,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,balanced,0.16230400403340658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,power_law_1.01,0.06651520133018493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,32,power_law_1.2,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,32,power_law_1.2,0.030291199684143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,power_law_1.01,0.08156160116195679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,32,power_law_1.2,0.03559040129184723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,power_law_1.01,0.09127039909362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,32,power_law_1.2,0.038553598523139956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,32,power_law_1.2,0.035392001271247864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,power_law_1.01,0.11976319551467896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,32,power_law_1.2,0.03816959857940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,power_law_1.01,0.14765440225601195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,balanced,0.20562666654586792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,32,power_law_1.2,0.03878400027751923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,32,power_law_1.2,0.04068480134010315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,32,power_law_1.2,0.04173440039157868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,power_law_1.01,0.24605441093444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,32,power_law_1.2,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,power_law_1.01,0.30458879470825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,power_law_1.01,0.41081600189208983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,32,power_law_1.2,0.0525056004524231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,32,power_law_1.2,0.05911039710044861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,power_law_1.01,0.5674240112304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,32,power_law_1.2,0.05546240210533142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,32,power_law_1.2,0.06972159743309021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,32,power_law_1.2,0.07703040242195129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,32,power_law_1.2,0.09514880180358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,power_law_1.01,0.7818431854248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,balanced,0.2585493326187134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,32,power_law_1.2,0.0377023994922638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,32,power_law_1.2,0.11168639659881592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,power_law_1.01,1.2541184425354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,32,power_law_1.2,0.03356800079345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,32,power_law_1.2,0.14258559942245483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,power_law_1.01,2.5680192947387694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,32,power_law_1.2,0.031788799166679385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,balanced,0.4973599910736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,32,power_law_1.2,0.1509503960609436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,32,power_law_1.2,0.032441601157188416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,32,power_law_1.2,0.2082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,32,power_law_1.2,0.033011201024055484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,32,power_law_1.2,0.2821120023727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,balanced,0.7301386992136637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,32,power_law_1.2,0.035046398639678955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,32,power_law_1.2,0.4888000011444092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,32,power_law_1.2,0.035257598757743834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,32,power_law_1.2,0.6390975952148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,32,power_law_1.2,0.0356799989938736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,32,power_law_1.2,0.8403519630432129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,32,power_law_1.2,0.03628160059452057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,32,power_law_1.2,1.277280044555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,32,power_law_1.2,0.03608959913253784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,balanced,0.41910401980082196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,32,power_law_1.2,0.038047999143600464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,32,power_law_1.2,2.8160127639770507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,32,power_law_1.2,0.03901439905166626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,32,power_law_1.2,0.04294399917125702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,32,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,32,power_law_1.2,0.04968959987163544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,32,power_law_1.2,0.05141119956970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,32,power_law_1.2,0.05616000294685364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,32,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,32,power_law_1.2,0.07033600211143494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,32,power_law_1.2,0.089055997133255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,32,power_law_1.2,0.0955136001110077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,32,power_law_1.2,0.12639360427856444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,32,power_law_1.2,0.14642560482025146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,32,power_law_1.2,0.20782721042633057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,32,power_law_1.2,0.2618304014205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,32,power_law_1.2,0.44128642082214353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,32,power_law_1.2,0.6487936019897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,32,power_law_1.2,0.7594880104064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,32,power_law_1.2,1.452723217010498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,32,power_law_1.2,3.342015838623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,balanced,0.8266613483428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,balanced,0.023002666731675465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,balanced,0.022874665757020313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,balanced,0.023029332359631855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,balanced,0.02646933247645696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,balanced,0.033813332517941795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,balanced,0.03490666548411051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,32,power_law_1.2,0.02685439884662628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,balanced,0.035599999129772186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,32,power_law_1.2,0.024300800263881685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,balanced,0.03573333223660787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,balanced,0.03333866596221924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,32,power_law_1.2,0.024031999707221984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,balanced,0.035391998787721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,32,power_law_1.2,0.026495999097824095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,balanced,0.0373279998699824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,32,power_law_1.2,0.027212798595428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,32,power_law_1.2,0.029894399642944335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,balanced,0.03676799933115641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,32,power_law_1.2,0.02956160008907318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,balanced,0.03701333453257879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,balanced,0.039546666045983635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,32,power_law_1.2,0.03000960052013397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,balanced,0.04496533175309499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,32,power_law_1.2,0.030131199955940248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,balanced,0.045647998650868736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,32,power_law_1.2,0.030079999566078187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,balanced,0.04735999802748362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,32,power_law_1.2,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,32,power_law_1.2,0.03287039995193482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,balanced,0.05564799904823303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,32,power_law_1.2,0.03463039994239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,32,power_law_1.2,0.038406398892402646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,balanced,0.06055466830730438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,32,power_law_1.2,0.04747520089149475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,32,power_law_1.2,0.0471807986497879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,balanced,0.0613919993241628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,32,power_law_1.2,0.049235200881958006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,balanced,0.07144000132878621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,balanced,0.030192000170548756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,32,power_law_1.2,0.06625279784202576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,balanced,0.029616000751654308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,32,power_law_1.2,0.07708799839019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,balanced,0.03125333289305369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,balanced,0.07659733295440674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,balanced,0.033045334120591484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,balanced,0.03427733232577642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,balanced,0.035749333600203194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,32,power_law_1.2,0.09473919868469238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,balanced,0.10107200344403584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,32,power_law_1.2,0.11404160261154175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,balanced,0.035877334574858345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,balanced,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,32,power_law_1.2,0.15420160293579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,balanced,0.03702933341264725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,32,power_law_1.2,0.19343359470367433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,power_law_1.01,0.032416000962257385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,balanced,0.11287466684977214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,balanced,0.0373279998699824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,power_law_1.01,0.026617598533630372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,balanced,0.03791466603676478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,32,power_law_1.2,0.2974720001220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,power_law_1.01,0.025254398584365845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,balanced,0.03984533250331879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,power_law_1.01,0.029337599873542786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,balanced,0.041002665956815086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,32,power_law_1.2,0.4757567882537842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,power_law_1.01,0.03131519854068756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,balanced,0.04080000023047129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,32,power_law_1.2,0.5799488067626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,balanced,0.16451733311017355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,power_law_1.01,0.03351039886474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,balanced,0.02421333392461141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,balanced,0.04221866528193156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,32,power_law_1.2,1.101740837097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,power_law_1.01,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,balanced,0.024218666056791942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,balanced,0.04763199885686239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,power_law_1.01,0.03400320112705231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,balanced,0.024720000723997753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,32,power_law_1.2,1.1534144401550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,balanced,0.04711999992529551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,power_law_1.01,0.03484799861907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,balanced,0.027290667096773785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,power_law_1.01,0.038438400626182555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,balanced,0.028405333558718365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,32,power_law_1.2,2.696147155761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,balanced,0.06001600126425425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,balanced,0.030026666820049286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,power_law_1.01,0.0414463996887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,power_law_1.01,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,balanced,0.030224000414212544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,32,power_law_1.2,4.876512145996093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,power_law_1.01,0.032652801275253295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,power_law_1.01,0.04293760061264038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,balanced,0.06676800052324931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,balanced,0.19805334011713663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,power_law_1.01,0.03268480002880096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,balanced,0.03001066545645396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,power_law_1.01,0.04412800073623657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,power_law_1.01,0.03309440016746521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,balanced,0.030074665943781536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,power_law_1.01,0.04594559967517853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,balanced,0.08098666866620381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,power_law_1.01,0.03526400029659271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,balanced,0.030746666093667347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,power_law_1.01,0.05069440007209778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,power_law_1.01,0.03555200099945068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,power_law_1.01,0.03551360070705414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,power_law_1.01,0.05310080051422119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,balanced,0.03073599934577942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,power_law_1.01,0.03738879859447479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,balanced,0.092357337474823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,power_law_1.01,0.05921279788017273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,balanced,0.03176533430814743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,power_law_1.01,0.03790079951286316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,power_law_1.01,0.03841919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,power_law_1.01,0.06710399985313416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,balanced,0.032586666444937386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,power_law_1.01,0.03903999924659729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,power_law_1.01,0.07056000232696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,balanced,0.03295466552178065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,power_law_1.01,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,balanced,0.12168000141779582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,power_law_1.01,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,power_law_1.01,0.07947520017623902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,power_law_1.01,0.04814079999923706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,balanced,0.23056532939275107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,power_law_1.01,0.08391039967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,balanced,0.03755733370780945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,power_law_1.01,0.047942399978637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,balanced,0.03675200045108795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,power_law_1.01,0.10992640256881714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,power_law_1.01,0.05275520086288452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,power_law_1.01,0.06407679915428162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,balanced,0.142794668674469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,power_law_1.01,0.13173120021820067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,power_law_1.01,0.06525440216064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,power_law_1.01,0.15800319910049437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,power_law_1.01,0.08021759986877441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,power_law_1.01,0.20867199897766114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,power_law_1.01,0.09479039907455444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,power_law_1.01,0.2903167963027954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,power_law_1.01,0.11419520378112794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,balanced,0.03773866593837738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,power_law_1.01,0.13665920495986938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,16,power_law_1.2,0.02961280047893524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,power_law_1.01,0.3738816022872925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,power_law_1.01,0.17560319900512694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,balanced,0.0439626673857371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,power_law_1.01,0.43788161277771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,16,power_law_1.2,0.023155200481414794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,power_law_1.01,0.21086080074310304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,balanced,0.20335467656453451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,power_law_1.01,0.3088128089904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,16,power_law_1.2,0.023238399624824525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,balanced,0.04533866544564565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,power_law_1.01,0.8023807525634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,power_law_1.01,0.028070399165153505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,power_law_1.01,0.4455423831939697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,16,power_law_1.2,0.02691200077533722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,power_law_1.01,0.5429503917694092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,power_law_1.01,1.3858048439025878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,power_law_1.01,0.026015999913215637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,16,power_law_1.2,0.029606398940086365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,power_law_1.01,0.8150848388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,power_law_1.01,0.024889600276947022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,16,power_law_1.2,0.03113600015640259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,balanced,0.3447786569595337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,power_law_1.01,0.026892799139022826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,power_law_1.01,1.7792320251464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,16,power_law_1.2,0.031097599864006044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,power_law_1.01,0.02858879864215851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,balanced,0.06247999767462412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,16,power_law_1.2,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,balanced,0.2549546758333842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,power_law_1.01,0.02985599935054779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,16,power_law_1.2,0.034796801209449765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,power_law_1.01,0.029951998591423036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,16,power_law_1.2,0.03829120099544525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,power_law_1.01,0.03036159873008728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,16,power_law_1.2,0.04296320080757141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,power_law_1.01,0.03200640082359314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,balanced,0.0817333310842514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,16,power_law_1.2,0.043059200048446655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,16,power_law_1.2,0.04413439929485321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,power_law_1.01,0.03375999927520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,power_law_1.01,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,balanced,0.0941546658674876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,16,power_law_1.2,0.0471807986497879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,power_law_1.01,0.037222400307655334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,16,power_law_1.2,0.05308799743652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,balanced,0.3055359919865926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,power_law_1.01,0.040191999077796935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,16,power_law_1.2,0.05489919781684875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,16,power_law_1.2,0.06524800062179566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,power_law_1.01,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,16,power_law_1.2,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,power_law_1.01,0.04780800044536591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,16,power_law_1.2,0.07605760097503662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,balanced,0.1269760032494863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,16,power_law_1.2,0.08814719915390015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,16,power_law_1.2,0.09651200175285339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,power_law_1.01,0.05069440007209778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,16,power_law_1.2,0.11310720443725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,power_law_1.01,0.06172800064086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,16,power_law_1.2,0.1485759973526001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,power_law_1.01,0.06932479739189149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,balanced,0.155349334081014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,16,power_law_1.2,0.2041088104248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,power_law_1.01,0.08325759768486023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,16,power_law_1.2,0.24136319160461425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,power_law_1.01,0.10007679462432861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,16,power_law_1.2,0.3802815914154053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,balanced,0.4776906569798787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,16,power_law_1.2,0.5247807979583741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,balanced,0.6397973299026489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,power_law_1.01,0.1359935998916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,balanced,0.23385600248972574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,16,power_law_1.2,0.6274367809295655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,power_law_1.01,0.16017279624938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,16,power_law_1.2,1.0480640411376954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,power_law_1.01,0.25696001052856443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,16,power_law_1.2,2.2304576873779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,power_law_1.01,0.3146752119064331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,power_law_1.01,0.45759358406066897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,power_law_1.01,0.5923647880554199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,balanced,0.3112213412920634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,power_law_1.01,0.7272511959075928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,power_law_1.01,1.1227456092834474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,power_law_1.01,2.5534975051879885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,balanced,0.38334401448567706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,balanced,0.9091200033823649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,16,power_law_1.2,0.03715200126171112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,16,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,16,power_law_1.2,0.03180800080299377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,balanced,0.5913653373718262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,16,power_law_1.2,0.03219839930534363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,16,power_law_1.2,0.03326080143451691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,16,power_law_1.2,0.034835198521614076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,16,power_law_1.2,0.03557760119438171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,16,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,16,power_law_1.2,0.037241598963737486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,16,power_law_1.2,0.037862399220466615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,16,power_law_1.2,0.03800959885120392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,16,power_law_1.2,0.03904640078544617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,16,power_law_1.2,0.04176000058650971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,16,power_law_1.2,0.041503998637199405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,16,power_law_1.2,0.050316798686981204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,16,power_law_1.2,0.051577597856521606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,16,power_law_1.2,0.05370879769325256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,16,power_law_1.2,0.06627839803695679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,16,power_law_1.2,0.06837760210037232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,16,power_law_1.2,0.08563200235366822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,16,power_law_1.2,0.10454399585723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,16,power_law_1.2,0.11736960411071777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,16,power_law_1.2,0.14357119798660278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,16,power_law_1.2,0.24208641052246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,16,power_law_1.2,0.259769606590271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,16,power_law_1.2,0.39872639179229735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,16,power_law_1.2,0.5933248043060303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,16,power_law_1.2,0.6830336093902588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,balanced,0.022954667607943218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,16,power_law_1.2,1.339750385284424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,balanced,0.022842665513356526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,balanced,0.023765332996845245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,16,power_law_1.2,2.269094467163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,balanced,0.027978666126728058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,balanced,0.033200000723203026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,balanced,0.034485332667827606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,balanced,1.1721759637196858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,16,power_law_1.2,0.026995199918746948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,balanced,0.03519999980926514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,balanced,0.03561066587766012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,16,power_law_1.2,0.02513279914855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,balanced,0.03282133241494497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,16,power_law_1.2,0.02503040134906769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,balanced,0.03568533311287562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,16,power_law_1.2,0.027116799354553224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,16,power_law_1.2,0.027846398949623107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,balanced,0.03489600121974945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,16,power_law_1.2,0.029068800806999206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,balanced,0.03788266579310099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,16,power_law_1.2,0.028998398780822755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,balanced,0.040778666734695435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,16,power_law_1.2,0.030342400074005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,balanced,0.046341334780057274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,16,power_law_1.2,0.031385600566864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,balanced,0.04622933268547058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,16,power_law_1.2,0.032051199674606325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,balanced,0.050373335679372154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,16,power_law_1.2,0.03323520123958588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,balanced,0.059061333537101746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,16,power_law_1.2,0.03475199937820435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,16,power_law_1.2,0.03653120100498199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,balanced,0.05809600154558817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,16,power_law_1.2,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,balanced,0.06679466863473256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,balanced,0.030671998858451843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,16,power_law_1.2,0.04433279931545257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,16,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,balanced,0.07077866792678833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,balanced,0.030224000414212544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,balanced,0.0317546675602595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,balanced,0.08496000369389851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,16,power_law_1.2,0.053504002094268796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,balanced,0.034917332231998444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,16,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,balanced,0.037130666275819145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,balanced,0.038346665600935616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,balanced,0.09200533231099446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,16,power_law_1.2,0.07487360239028931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,balanced,0.03895466774702072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,balanced,0.038431999584039055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,16,power_law_1.2,0.08947839736938476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,balanced,0.03849600007136663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,balanced,0.12598933776219687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,16,power_law_1.2,0.11399680376052856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,balanced,0.039077334105968475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,balanced,0.039520000418027244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,16,power_law_1.2,0.1415168046951294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,balanced,0.03976000100374222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,16,power_law_1.2,0.2074944019317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,balanced,0.15037332971890768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,balanced,0.04098133246103922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,power_law_1.01,0.026899200677871705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,balanced,0.02534399926662445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,balanced,0.04417066772778829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,16,power_law_1.2,0.32848639488220216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,power_law_1.01,0.024332800507545473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,balanced,0.026357332865397137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,balanced,0.044394666949907936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,power_law_1.01,0.023705600202083586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,16,power_law_1.2,0.43235201835632325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,balanced,0.026752000053723652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,power_law_1.01,0.030348798632621764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,balanced,0.04507733384768168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,balanced,0.03009066730737686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,16,power_law_1.2,0.6587264060974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,power_law_1.01,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,balanced,0.03201599915822347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,balanced,0.05192000170548757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,power_law_1.01,0.031007999181747438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,balanced,0.22535999615987143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,16,power_law_1.2,0.7645823955535889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,power_law_1.01,0.03195520043373108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,balanced,0.03355200091997782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,balanced,0.051183998584747314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,16,power_law_1.2,1.46943998336792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,power_law_1.01,0.03182719945907593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,balanced,0.03349333256483078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,power_law_1.01,0.0333759993314743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,16,power_law_1.2,2.1535104751586913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,balanced,0.03349866718053818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,power_law_1.01,0.0344895988702774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,balanced,0.0683840016523997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,balanced,0.03412266572316488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,power_law_1.01,0.037536001205444335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,power_law_1.01,0.039052799344062805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,balanced,0.03484266748030981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,16,power_law_1.2,5.0843456268310545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,balanced,0.07764799892902374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,power_law_1.01,0.041203200817108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,balanced,0.03493333359559377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,power_law_1.01,0.04766719937324524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,balanced,0.03614933292071024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,balanced,0.2714986602465312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,power_law_1.01,0.05300480127334595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,balanced,0.0367999995748202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,balanced,0.0965280036131541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,power_law_1.01,0.05472639799118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,balanced,0.037402667105197906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,power_law_1.01,0.05953279733657837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,power_law_1.01,0.06600959897041321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,power_law_1.01,0.03509120047092438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,power_law_1.01,0.07146239876747132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,balanced,0.10866133371988933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,balanced,0.04285866518815359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,power_law_1.01,0.030662399530410767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,power_law_1.01,0.07735679745674133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,power_law_1.01,0.0918720006942749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,balanced,0.0429013321797053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,power_law_1.01,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,power_law_1.01,0.11443840265274048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,power_law_1.01,0.034176000952720643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,power_law_1.01,0.12664320468902587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,balanced,0.14881599942843118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,power_law_1.01,0.16328959465026854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,power_law_1.01,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,balanced,0.3388959964116414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,power_law_1.01,0.2128063917160034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,power_law_1.01,0.31631999015808104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,balanced,0.04550399879614512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,power_law_1.01,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,power_law_1.01,0.3878015995025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,balanced,0.05386666456858317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,power_law_1.01,0.03839359879493713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,balanced,0.18659732739130655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,power_law_1.01,0.5096127986907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,power_law_1.01,0.03841919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,balanced,0.0568800022204717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,power_law_1.01,0.8562175750732421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,power_law_1.01,0.03943679928779602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,power_law_1.01,1.7817407608032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,power_law_1.01,0.040243199467658995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,power_law_1.01,0.04156799912452698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,power_law_1.01,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,balanced,0.07431999842325847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,power_law_1.01,0.042777600884437564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,power_law_1.01,0.04535680115222931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,balanced,0.27481599648793537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,balanced,0.08297599852085114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,power_law_1.01,0.05062400102615357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,power_law_1.01,0.05560960173606873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,power_law_1.01,0.06716160178184509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,balanced,0.5261973142623901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,power_law_1.01,0.0685696005821228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,power_law_1.01,0.08256000280380249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,balanced,0.11006933450698853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,power_law_1.01,0.09872000217437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,power_law_1.01,0.12565759420394898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,power_law_1.01,0.14911359548568726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,balanced,0.3523413340250651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,balanced,0.1327306628227234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,power_law_1.01,0.2100543975830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,power_law_1.01,0.26496639251708987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,power_law_1.01,0.3524672031402588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,power_law_1.01,0.48360958099365237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,power_law_1.01,0.6270527839660645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,power_law_1.01,1.0632960319519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,balanced,0.1996799906094869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,power_law_1.01,1.9912832260131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,8,power_law_1.2,0.026617598533630372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,balanced,0.43598934014638263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,8,power_law_1.2,0.022329600155353548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,8,power_law_1.2,0.023628799617290495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,balanced,0.26128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,8,power_law_1.2,0.028512001037597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,power_law_1.01,0.026867198944091796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,8,power_law_1.2,0.028403198719024657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,power_law_1.01,0.02910720109939575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,8,power_law_1.2,0.03155199885368347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,power_law_1.01,0.031481599807739256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,8,power_law_1.2,0.03313280045986176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,power_law_1.01,0.03315199911594391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,8,power_law_1.2,0.035820800065994265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,power_law_1.01,0.03364480137825012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,balanced,0.3756800095240275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,8,power_law_1.2,0.03391999900341034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,power_law_1.01,0.03498879969120026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,8,power_law_1.2,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,power_law_1.01,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,8,power_law_1.2,0.038201600313186646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,power_law_1.01,0.03671680092811584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,8,power_law_1.2,0.040249601006507874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,8,power_law_1.2,0.04266240000724793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,power_law_1.01,0.038361600041389464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,8,power_law_1.2,0.0486272007226944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,power_law_1.01,0.04043520092964172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,balanced,0.9686773618062338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,8,power_law_1.2,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,power_law_1.01,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,8,power_law_1.2,0.05449600219726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,power_law_1.01,0.04317440092563629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,balanced,0.6944853464762369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,8,power_law_1.2,0.06204800009727478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,balanced,0.48892800013224286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,power_law_1.01,0.05028480291366577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,8,power_law_1.2,0.0720192015171051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,power_law_1.01,0.054611200094223024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,8,power_law_1.2,0.07508479952812194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,8,power_law_1.2,0.08398720026016235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,power_law_1.01,0.05783680081367493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,8,power_law_1.2,0.0952127993106842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,power_law_1.01,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,power_law_1.01,0.08289920091629029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,8,power_law_1.2,0.1334720015525818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,8,power_law_1.2,0.13982080221176146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,power_law_1.01,0.09500160217285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,power_law_1.01,0.1161471962928772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,8,power_law_1.2,0.19275519847869874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,balanced,0.6075786749521891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,8,power_law_1.2,0.27799038887023925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,power_law_1.01,0.1499519944190979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,8,power_law_1.2,0.35852799415588377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,power_law_1.01,0.21294078826904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,8,power_law_1.2,0.5519231796264649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,power_law_1.01,0.32527999877929686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,8,power_law_1.2,0.788428783416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,power_law_1.01,0.36611199378967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,8,power_law_1.2,1.210912036895752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,power_law_1.01,0.6572224140167237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,power_law_1.01,0.7703743934631347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,power_law_1.01,1.01278076171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,8,power_law_1.2,2.6765567779541017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,power_law_1.01,1.5749695777893067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,power_law_1.01,3.186623954772949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,balanced,0.9464960098266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,balanced,1.2911252975463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,8,power_law_1.2,0.03424000144004822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,8,power_law_1.2,0.030048000812530517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,8,power_law_1.2,0.030163198709487915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,8,power_law_1.2,0.03240320086479187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,8,power_law_1.2,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,8,power_law_1.2,0.036006399989128114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,8,power_law_1.2,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,8,power_law_1.2,0.03759360015392303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,8,power_law_1.2,0.038553598523139956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,8,power_law_1.2,0.03934719860553741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,8,power_law_1.2,0.03994239866733551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,8,power_law_1.2,0.04270719885826111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,8,power_law_1.2,0.04521600008010864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,8,power_law_1.2,0.04296320080757141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,8,power_law_1.2,0.04865919947624207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,8,power_law_1.2,0.05167359709739685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,8,power_law_1.2,0.05916159749031067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,8,power_law_1.2,0.06850559711456299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,8,power_law_1.2,0.07152640223503112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,8,power_law_1.2,0.09308800101280212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,8,power_law_1.2,0.10590720176696777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,8,power_law_1.2,0.13570560216903688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,8,power_law_1.2,0.15422719717025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,8,power_law_1.2,0.21327359676361085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,balanced,1.8763093948364258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,8,power_law_1.2,0.028575998544692994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,8,power_law_1.2,0.341427206993103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,8,power_law_1.2,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,8,power_law_1.2,0.02687999904155731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,8,power_law_1.2,0.6280064105987548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,8,power_law_1.2,0.8099455833435059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,8,power_law_1.2,0.02705279886722565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,8,power_law_1.2,1.475327968597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,8,power_law_1.2,0.029926401376724244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,8,power_law_1.2,2.727609634399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,8,power_law_1.2,0.03086720108985901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,8,power_law_1.2,0.03386879861354828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,8,power_law_1.2,0.03456639945507049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,8,power_law_1.2,0.03498879969120026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,balanced,0.04509866734345754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,8,power_law_1.2,0.03578880131244659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,balanced,0.04274133344491323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,8,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,balanced,0.0431573341290156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,8,power_law_1.2,0.038464000821113585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,8,power_law_1.2,0.040780800580978396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,balanced,0.07730133334795634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,8,power_law_1.2,0.04161919951438904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,balanced,0.07820266485214233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,8,power_law_1.2,0.04670720100402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,balanced,0.07886399825414021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,balanced,0.07948799928029378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,balanced,0.0796319991350174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,8,power_law_1.2,0.04947839975357056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,8,power_law_1.2,0.05568000078201294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,balanced,0.07941866914431255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,balanced,0.08084799846013387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,balanced,0.08160533507664998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,8,power_law_1.2,0.06021760106086731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,balanced,0.082096000512441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,8,power_law_1.2,0.06828799843788147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,8,power_law_1.2,0.08490239977836608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,balanced,0.03679466744263967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,balanced,0.08936533331871033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,balanced,0.09238933523495992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,balanced,0.03674133370320002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,8,power_law_1.2,0.10884480476379395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,balanced,0.03695466617743174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,balanced,0.09311999877293904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,balanced,0.04338666796684265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,8,power_law_1.2,0.11943680047988892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,balanced,0.05936000247796377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,balanced,0.095551997423172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,balanced,0.06039466460545858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,8,power_law_1.2,0.19313280582427977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,balanced,0.0612960010766983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,balanced,0.09860799709955852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,balanced,0.060959999759991966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,8,power_law_1.2,0.251692795753479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,balanced,0.09885866443316142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,balanced,0.061850666999816895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,balanced,0.062368000547091164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,8,power_law_1.2,0.3589567899703979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,balanced,0.1034346620241801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,balanced,0.06356800099213918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,balanced,0.06363733112812042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,8,power_law_1.2,0.5371327877044678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,balanced,0.06457066535949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,balanced,0.11341333389282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,8,power_law_1.2,0.7639359951019287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,balanced,0.06640000144640605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,8,power_law_1.2,0.9003007888793946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,balanced,0.07060266534487407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,balanced,0.13341866930325827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,balanced,0.07157333195209503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,8,power_law_1.2,1.2261568069458009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,balanced,0.07372266550858815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,8,power_law_1.2,2.011071968078613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,balanced,0.077674667040507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,balanced,0.13424000144004822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,8,power_law_1.2,5.280185699462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,balanced,0.0820906658967336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,balanced,0.09447999795277913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,balanced,0.20028799772262573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,balanced,0.10356799761454265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,balanced,0.12402133146921794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,balanced,0.029487999776999157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,balanced,0.2090346614519755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,balanced,0.029253333806991577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.07218559980392455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,balanced,0.14106667041778564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,balanced,0.029279999434947968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.053260797262191774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,balanced,0.03728000074625015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,balanced,0.05346666773160299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,balanced,0.05470933516820272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,balanced,0.19858666261037192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.06097279787063599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,balanced,0.29093867540359497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,balanced,0.055445333321889244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,balanced,0.05519466598828634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.07342720031738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,balanced,0.0558186670144399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.0782975971698761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,balanced,0.05639466643333435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,balanced,0.22899200518925986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.07466239929199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.04533120095729828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,balanced,0.057162667314211525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.07907840013504028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,balanced,0.05820266902446747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.04475519955158234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.08328319787979126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,balanced,0.058549334605534874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.049670401215553286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,balanced,0.059445331494013466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.08489599823951721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,balanced,0.329370657602946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.05565440058708191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.08528640270233154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.05986559987068176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,balanced,0.32018133004506427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.08855040073394775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.060121601819992064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.09675520062446594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.06087039709091187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,balanced,0.06401599943637848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.09789440035820007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.06133120059967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.10228480100631714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,balanced,0.06419733166694641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.06506879925727845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.10885119438171387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.0637440025806427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.11588480472564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.13868160247802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,balanced,0.4124106566111247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,balanced,0.3931359847386678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.16673920154571534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.2256704092025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.06939520239830017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.33799679279327394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.07534080147743225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.08140799999237061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.3281280040740967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.08334720134735107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,balanced,0.06793599824110667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.01,0.44136958122253417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.09835519790649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,balanced,0.07377600173155467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.01,0.47511677742004393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.11681920289993286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.01,0.8021120071411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,balanced,0.07513600091139476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.14871679544448851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,balanced,0.48518399397532147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.01,0.9743231773376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.15851520299911498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.21458559036254882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.01,1.166163158416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.28501760959625244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.05004159808158874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.01,2.195743942260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,balanced,0.08699199557304382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.3506943941116333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.056806397438049314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,power_law_1.01,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.06373760104179382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,balanced,0.634496013323466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,0.4638207912445068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.01,3.928339385986328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,balanced,0.09268266956011455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.06647040247917176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,power_law_1.01,0.04062080085277557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,0.6196415901184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.07568640112876893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.07841920256614685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,power_law_1.01,0.035750401020050046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,0.8133760452270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,balanced,0.11732799808184306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.0809664011001587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,power_law_1.01,0.04352000057697296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.08203520178794861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.01,1.0700927734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.07960320115089417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,power_law_1.01,0.04933120012283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.01,1.8221439361572265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,balanced,0.1325226624806722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.2269376039505005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,power_law_1.01,0.0523904025554657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.23322880268096924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.5198592185974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.01,3.7249473571777343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.09879040122032165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,power_law_1.01,0.05504639744758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.1048192024230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,balanced,0.1766773263613383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,power_law_1.01,0.05960320234298706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,balanced,0.7507359981536865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.1091647982597351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,power_law_1.01,0.058208000659942624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.12237440347671509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,power_law_1.01,0.06268799901008607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.13728640079498292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,power_law_1.01,0.06564480066299438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.15419520139694215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,balanced,0.22334933280944824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.18711040019989014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,power_law_1.01,0.0643392026424408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.2684351921081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,power_law_1.01,0.07549440264701843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.4051328182220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,32,power_law_1.2,0.4293504238128662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,32,power_law_1.2,0.5825791835784913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,power_law_1.01,0.07758079767227173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,32,power_law_1.2,0.8360896110534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,power_law_1.01,0.08076800107955932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,32,power_law_1.2,1.3537535667419434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,32,power_law_1.2,1.524294376373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,32,power_law_1.2,2.26190071105957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,power_law_1.01,0.08446080088615418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,balanced,0.34242133299509686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,32,power_law_1.2,3.626847839355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,power_law_1.01,0.10296319723129273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.01,0.1238144040107727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,power_law_1.2,10.568870544433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.01,0.1487936019897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,32,balanced,1.2063039938608806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.01,0.18229119777679442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.01,0.2662208080291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.01,0.3737472057342529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,balanced,0.442848006884257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.01,0.5378367900848389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.01,0.6618112087249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.01,1.0615872383117675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.03734399974346161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.01,1.2519871711730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.04229759871959686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,balanced,1.447098731994629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.0493120014667511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,power_law_1.01,1.8199871063232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.04385280013084412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,balanced,0.5650240182876587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,power_law_1.01,2.9025344848632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.05975679755210876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.0587007999420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,power_law_1.01,5.611788940429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.06095359921455383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.06291840076446534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.0644927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.06234239935874939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.06761599779129028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.07356160283088684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.07222399711608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.08122239708900451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,balanced,0.8756213188171387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.08688639998435974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.0847104012966156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.10935039520263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.12138880491256714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.1648319959640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.18588800430297853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.2500288009643555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.29971840381622317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,0.45157761573791505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,0.5874944210052491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,1.0424320220947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,1.120729637145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,32,power_law_1.2,1.6822463989257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,32,power_law_1.2,2.5727359771728517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,32,power_law_1.2,6.923808288574219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,balanced,1.7293012936909993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,32,power_law_1.2,0.050457602739334105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,32,power_law_1.2,0.036671999096870425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,32,power_law_1.2,0.037036800384521486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,balanced,0.037231999138991036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,32,power_law_1.2,0.04425599873065948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,balanced,0.03608000030120214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,32,power_law_1.2,0.04611839950084686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,balanced,0.042303999265034996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,balanced,0.05583466589450836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,32,power_law_1.2,0.05419520139694214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,balanced,0.08184533317883809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,balanced,0.07435733576615651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,32,power_law_1.2,0.05553280115127564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,balanced,0.07513066629568736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,32,power_law_1.2,0.05555199980735779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,balanced,0.07985599835713704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,32,power_law_1.2,0.05989760160446167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,balanced,0.07996266583601634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,32,power_law_1.2,0.06079360246658325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,balanced,0.08010666569073994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,balanced,0.0811359981695811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,32,power_law_1.2,0.06159359812736511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,balanced,0.08141866823037465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,32,power_law_1.2,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,balanced,0.0824533353249232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,32,power_law_1.2,0.0682752013206482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,balanced,0.08823466300964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,32,power_law_1.2,0.07678080201148987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,balanced,0.09190932909647624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,balanced,0.09237333138783772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,32,power_law_1.2,0.08435840010643006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,balanced,0.09442666172981262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,32,power_law_1.2,0.09140480160713196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,balanced,0.09802132844924927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,balanced,0.10261332988739014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,balanced,0.0348693331082662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,32,power_law_1.2,0.0893887996673584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,balanced,0.11026666561762492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,balanced,0.0349386657277743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,32,power_law_1.2,0.11909120082855225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,balanced,0.03496533383925756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.2,0.1472640037536621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,balanced,0.12241066495577495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,balanced,0.04038933416207632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,balanced,0.059114664793014526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,balanced,0.06065066655476888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.2,0.17055360078811646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,balanced,0.14334932963053384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,balanced,0.061797335743904114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,balanced,0.06121600170930227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.2,0.1892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,balanced,0.06208533545335134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.2,0.32490880489349366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,balanced,0.0631573349237442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,balanced,0.028346667687098186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,balanced,0.1476853291193644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,balanced,0.0639519989490509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.2,0.4038976192474365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,balanced,0.06319466729958852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,balanced,0.028250666956106823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.2,0.760537576675415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,balanced,0.029711998999118805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,balanced,0.06595199803511302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.2,0.8842559814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,balanced,0.03602133442958196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,balanced,0.2158986727396647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,balanced,0.0711839993794759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,balanced,0.05400000015894572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,balanced,0.0714026689529419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,balanced,0.05540800094604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,balanced,0.0746666689713796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.2,1.5892736434936523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,balanced,0.05641599992911021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,balanced,0.08065600196520488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,balanced,0.0558186670144399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.2,2.202867126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,balanced,0.08597866694132487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.01,0.07352960109710693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,balanced,0.2390026648839315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,balanced,0.05677333474159241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.01,0.055327999591827395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,32,power_law_1.2,2.9610048294067384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,balanced,0.09666132926940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,balanced,0.05755733450253805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.01,0.063264000415802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.01,0.04405759871006012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,balanced,0.05796800057093302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.01,0.04984320104122162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.01,0.03733760118484497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,32,power_law_1.2,6.117292785644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,balanced,0.10714667042096455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,balanced,0.058970664938290916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.01,0.05912320017814636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.01,0.041503998637199405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.01,0.06352000236511231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,balanced,0.05990933378537496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.01,0.07124480009078979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.01,0.047091200947761536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,32,power_law_1.2,11.11492462158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,balanced,0.13612799843152365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,balanced,0.06131199995676676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.01,0.07537919878959656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,balanced,0.3365226586659749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.01,0.058220797777175905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.01,0.07820799946784973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.01,0.05985280275344849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.01,0.08020480275154114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,balanced,0.1546026666959127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.01,0.060134398937225345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.01,0.0807424008846283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.01,0.08367999792098998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,balanced,0.06628799935181935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.01,0.08831359744071961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.01,0.06155520081520081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.01,0.09471359848976135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,balanced,0.0673173318306605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,balanced,0.2176213264465332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.01,0.06390399932861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.01,0.0936191976070404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.01,0.10156799554824829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.01,0.06522240042686463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,balanced,0.3912159999211629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.01,0.1051584005355835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.01,0.06449919939041138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.01,0.10725760459899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.01,0.06692479848861695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.01,0.11927679777145386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,balanced,0.2627039949099223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.01,0.13485440015792846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.01,0.07609599828720093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.01,0.14826879501342774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,balanced,0.07164266705513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.01,0.07932159900665284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.01,0.2148736000061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.01,0.08548480272293091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.01,0.30222721099853517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,balanced,0.08027733365694682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.01,0.09379199743270875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.01,0.25594239234924315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.01,0.10559999942779541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.01,0.3507711887359619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,balanced,0.08271466692288716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.01,0.12983039617538453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.01,0.4280831813812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,balanced,0.3760693470637004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.01,0.6223040103912354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.01,0.14313600063323975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,balanced,0.49411733945210773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.01,0.21276800632476806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.01,0.888326358795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.01,0.235315203666687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.01,0.9864704132080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,balanced,0.09912533561388652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.01,0.31239678859710696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.01,1.5415743827819823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.01,0.4630335807800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,balanced,0.10868799686431885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.01,3.911577606201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.01,0.5668608188629151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.01,0.852723217010498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,balanced,0.14433599511782327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.01,0.9332991600036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,balanced,0.4635733366012573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.01,1.556492805480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,balanced,0.1697546641031901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.01,3.6408767700195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,power_law_1.01,0.05386880040168762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,balanced,0.24708799521128336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,power_law_1.01,0.03739520013332367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,balanced,0.7503413359324137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,power_law_1.01,0.03199360072612763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,16,power_law_1.2,0.07347840070724487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,power_law_1.01,0.04254080057144165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,16,power_law_1.2,0.045023998618125914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,balanced,0.5745919942855835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,balanced,0.3217653234799703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,power_law_1.01,0.04490239918231964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,16,power_law_1.2,0.04929920136928558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,power_law_1.01,0.053907197713851926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,16,power_law_1.2,0.05194240212440491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,power_law_1.01,0.0564736008644104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,16,power_law_1.2,0.06027519702911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,power_law_1.01,0.057017600536346434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,16,power_law_1.2,0.06995840072631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,power_law_1.01,0.05628160238265991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,16,power_law_1.2,0.07334399819374085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,16,power_law_1.2,0.07562239766120911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,power_law_1.01,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,16,power_law_1.2,0.07861760258674622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,power_law_1.01,0.06229119896888733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,16,power_law_1.2,0.08225280046463013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,power_law_1.01,0.06544640064239501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,balanced,0.4764639933904012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,16,power_law_1.2,0.08561919927597046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,power_law_1.01,0.06627839803695679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,16,power_law_1.2,0.0911679983139038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,power_law_1.01,0.07486720085144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,16,power_law_1.2,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,16,power_law_1.2,0.10002559423446655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,balanced,0.8680799802144369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,power_law_1.01,0.08078719973564148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,16,power_law_1.2,0.10375039577484131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,power_law_1.01,0.07925119996070862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,16,power_law_1.2,0.1095039963722229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,balanced,0.6072959899902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,16,power_law_1.2,0.10835839509963989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,16,power_law_1.2,0.13256319761276245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,power_law_1.01,0.08606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,power_law_1.01,0.0991104006767273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,16,power_law_1.2,0.14094719886779786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,power_law_1.01,0.12083200216293336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,16,power_law_1.2,0.17793920040130615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,16,power_law_1.2,0.19868160486221315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,balanced,1.4588534037272136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,power_law_1.01,0.1481727957725525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,16,power_law_1.2,0.3326783895492554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,power_law_1.01,0.17138559818267823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,16,power_law_1.2,0.33228800296783445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,power_law_1.01,0.29113600254058836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,16,power_law_1.2,0.463699197769165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,balanced,0.7686399618784586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,power_law_1.01,0.3907455921173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,16,power_law_1.2,0.5144832134246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,power_law_1.01,0.4670720100402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,16,power_law_1.2,0.8141375541687011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,power_law_1.01,0.6731520175933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,16,power_law_1.2,1.3173888206481934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,power_law_1.01,0.9572480201721192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,16,power_law_1.2,1.883967971801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,power_law_1.01,1.2070015907287597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,16,power_law_1.2,2.832588768005371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,power_law_1.01,1.7190208435058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,16,power_law_1.2,6.768831634521485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,power_law_1.01,2.6476287841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,power_law_1.01,5.564563369750976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,balanced,1.2018240292867024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,balanced,1.693738619486491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,16,power_law_1.2,0.058406400680541995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,16,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,16,power_law_1.2,0.036646398901939395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,16,power_law_1.2,0.040115201473236085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,16,power_law_1.2,0.05148800015449524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,16,power_law_1.2,0.05875840187072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,16,power_law_1.2,0.060166400671005246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,16,power_law_1.2,0.06101760268211365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,16,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,16,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,16,power_law_1.2,0.06268159747123718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,16,power_law_1.2,0.06446080207824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,16,power_law_1.2,0.07006719708442688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,16,power_law_1.2,0.07087360024452209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,16,power_law_1.2,0.07786880135536194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,16,power_law_1.2,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,16,power_law_1.2,0.08364160060882568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,16,power_law_1.2,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,16,power_law_1.2,0.1108288049697876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,16,power_law_1.2,0.13116159439086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,balanced,2.3771467208862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,16,power_law_1.2,0.16584320068359376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,16,power_law_1.2,0.22624640464782714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,balanced,0.03403733422358831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,16,power_law_1.2,0.29409921169281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,balanced,0.03882133215665817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,16,power_law_1.2,0.39555199146270753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,balanced,0.03869866579771042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,16,power_law_1.2,0.4893184185028076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,16,power_law_1.2,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,balanced,0.056048000852266945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,16,power_law_1.2,0.8092608451843262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,16,power_law_1.2,0.03219200074672699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,balanced,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,16,power_law_1.2,1.1270719528198243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,16,power_law_1.2,0.03284479975700379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,balanced,0.0835040012995402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,16,power_law_1.2,1.580198383331299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,16,power_law_1.2,0.03674240112304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,balanced,0.08462933699289958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,16,power_law_1.2,0.04653440117835998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,16,power_law_1.2,2.016755294799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,balanced,0.08159466584523518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,balanced,0.08098666866620381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,16,power_law_1.2,0.05459200143814087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,16,power_law_1.2,5.532563018798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,16,power_law_1.2,0.05556480288505554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,balanced,0.08214400211970012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,16,power_law_1.2,0.056032001972198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,balanced,0.08161066472530365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,16,power_law_1.2,0.060192000865936277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,16,power_law_1.2,0.06104320287704468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,balanced,0.08410132924715678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,16,power_law_1.2,0.0652671992778778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,balanced,0.08366400003433228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,16,power_law_1.2,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,balanced,0.08964799841245015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,balanced,0.09451733032862346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,16,power_law_1.2,0.07022719979286193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,balanced,0.09629866480827332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,16,power_law_1.2,0.0754688024520874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,balanced,0.09828266501426697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,balanced,0.10501333077748616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,16,power_law_1.2,0.08233600258827209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,balanced,0.11173333724339803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,16,power_law_1.2,0.09070079922676086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,balanced,0.12446932991345723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,balanced,0.13434666395187378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,16,power_law_1.2,0.0907904028892517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,16,power_law_1.2,0.11568000316619872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,16,power_law_1.2,0.1376960039138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,balanced,0.1704746683438619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,balanced,0.03305066625277201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,16,power_law_1.2,0.1614527940750122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,balanced,0.181877334912618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,16,power_law_1.2,0.24404480457305908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,balanced,0.034341332813103996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,16,power_law_1.2,0.35917439460754397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,balanced,0.03493333359559377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,16,power_law_1.2,0.4389056205749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,balanced,0.04131733377774557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,balanced,0.26557334264119464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,balanced,0.05910933514436086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,16,power_law_1.2,0.7732927799224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,balanced,0.061103999614715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,16,power_law_1.2,0.9312576293945313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,balanced,0.0620959997177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,balanced,0.062224000692367554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,16,power_law_1.2,1.148140811920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,balanced,0.3046560088793437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,balanced,0.06259199976921082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,16,power_law_1.2,1.9311359405517579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,balanced,0.06340266764163971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,balanced,0.06550399959087372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,16,power_law_1.2,2.377280044555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,16,power_law_1.2,5.071104049682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,balanced,0.06669866542021434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,balanced,0.06763199965159099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,balanced,0.4356906811396281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,16,power_law_1.2,9.971968078613282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,balanced,0.07434666653474171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,balanced,0.07467733323574066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.01,0.04019840061664581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.01,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,balanced,0.08046400050322215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.01,0.03722879886627197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.01,0.04615040123462677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,balanced,0.08705066641171773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.01,0.036025598645210266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.01,0.042956799268722534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.01,0.05370240211486817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.01,0.043750399351119997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,balanced,0.09297066926956177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.01,0.05856639742851257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.01,0.049497601389884946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.01,0.07747840285301208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,balanced,0.10739200313886006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,balanced,0.02916266769170761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,balanced,0.5186560153961182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.01,0.08051199913024902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.01,0.05783680081367493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.01,0.07811840176582337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,balanced,0.030080000559488933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.01,0.058336001634597776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,balanced,0.11983999609947205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.01,0.07824000120162963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,balanced,0.030954666435718536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.01,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.01,0.08330879807472229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.01,0.08491520285606384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.01,0.06093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,balanced,0.1590506633122762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.01,0.08662400245666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.01,0.062080001831054686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.01,0.08642560243606567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,balanced,0.05699199934800466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.01,0.08835840225219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.01,0.06368640065193176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.01,0.10295679569244384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,balanced,0.05842133363087972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.01,0.06956160068511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,balanced,0.18588799238204956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.01,0.10417280197143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.01,0.07299839854240417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,balanced,0.05778666834036509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.01,0.10825599431991577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.01,0.12345600128173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,balanced,0.060517330964406334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.01,0.07400320172309875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.01,0.13889919519424437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,balanced,0.6590720017751058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,balanced,0.06025066475073496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.01,0.0778432011604309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,balanced,0.2670560081799825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.01,0.1600640058517456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,balanced,0.06122133135795593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.01,0.08439040184020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.01,0.17863039970397948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,balanced,0.06248533229033152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.01,0.25157120227813723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.01,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.01,0.2543423891067505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.01,0.1035264015197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,balanced,0.06398933132489522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.01,0.36428160667419435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.01,0.11496959924697876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,balanced,0.06628266473611195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.01,0.4394495964050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,balanced,0.3301706711451213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.01,0.12902400493621827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.01,0.6494527816772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.01,0.15701119899749755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.01,0.8194047927856445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.01,0.21843841075897216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.01,0.9576191902160645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.01,0.249619197845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,balanced,0.07349333167076111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.01,1.6503871917724608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.01,0.35223679542541503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,balanced,0.07468800246715546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.01,3.5158206939697267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.01,0.43084158897399905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,balanced,0.4771893421808879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.01,0.6372096061706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.01,0.8660863876342774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.01,0.9825984001159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,balanced,0.9772266546885172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.01,1.880076789855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,balanced,0.0831413318713506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,power_law_1.01,0.03923200070858002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,balanced,0.09546132882436116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.01,3.4216575622558594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,power_law_1.01,0.033267199993133545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,balanced,0.09922666351000468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,balanced,0.6007573207219442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,power_law_1.01,0.0347135990858078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,power_law_1.01,0.04048640131950378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,power_law_1.01,0.045926401019096376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,balanced,0.12459733088811238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,power_law_1.01,0.058323198556900026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,power_law_1.01,0.058316802978515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,power_law_1.01,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,balanced,0.14193066954612732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,power_law_1.01,0.061478400230407716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,power_law_1.01,0.06407679915428162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,power_law_1.01,0.06789759993553161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,balanced,0.2150826652844747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,power_law_1.01,0.0742464005947113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,balanced,0.7567306359608968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,power_law_1.01,0.0770367980003357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,8,power_law_1.2,0.0525056004524231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,balanced,0.26410667101542157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,8,power_law_1.2,0.04296959936618805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,power_law_1.01,0.08737279772758484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,8,power_law_1.2,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,power_law_1.01,0.09129599928855896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,8,power_law_1.2,0.05018240213394165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,8,power_law_1.2,0.05331839919090271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,balanced,0.3766239881515503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,8,power_law_1.2,0.07580800056457519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,power_law_1.01,0.09957759976387023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,8,power_law_1.2,0.08080000281333924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,power_law_1.01,0.12200319766998291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,8,power_law_1.2,0.07859839797019959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,power_law_1.01,0.13619840145111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,8,power_law_1.2,0.07989119887351989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,8,power_law_1.2,0.08239359855651855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,power_law_1.01,0.1710911989212036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,balanced,0.4850240151087443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,power_law_1.01,0.22574079036712646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,8,power_law_1.2,0.08398720026016235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,power_law_1.01,0.31496319770812986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,8,power_law_1.2,0.08684160113334656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,power_law_1.01,0.41792001724243166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,8,power_law_1.2,0.08901119828224183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,power_law_1.01,0.6275455951690674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,8,power_law_1.2,0.09567360281944275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,power_law_1.01,0.7839807987213134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,balanced,1.90449062983195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,8,power_law_1.2,0.1031872034072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,balanced,1.1183946927388508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,power_law_1.01,1.2354240417480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,8,power_law_1.2,0.10800000429153442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,balanced,0.7090293566385905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,power_law_1.01,1.5348416328430177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,8,power_law_1.2,0.11415679454803467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,power_law_1.01,1.813523292541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,8,power_law_1.2,0.12654720544815062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,8,power_law_1.2,0.14596480131149292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,power_law_1.01,2.88342399597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,8,power_law_1.2,0.1592128038406372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,8,power_law_1.2,0.19866880178451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,power_law_1.01,6.034675216674804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,8,power_law_1.2,0.28092160224914553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,8,power_law_1.2,0.2864000082015991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,balanced,0.9243093331654867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,8,power_law_1.2,0.4254271984100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,8,power_law_1.2,0.5399871826171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,8,power_law_1.2,0.7529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,8,power_law_1.2,1.1107263565063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,8,power_law_1.2,1.3614015579223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,8,power_law_1.2,2.2814847946166994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,8,power_law_1.2,5.439686584472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,8,power_law_1.2,0.03710080087184906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,balanced,1.1668372948964436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,8,power_law_1.2,0.03447679877281189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,8,power_law_1.2,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,8,power_law_1.2,0.04140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,8,power_law_1.2,0.04545280039310455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,8,power_law_1.2,0.05839359760284424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,8,power_law_1.2,0.05950719714164734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,8,power_law_1.2,0.061862397193908694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,8,power_law_1.2,0.05999360084533691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,balanced,2.213343938191732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,8,power_law_1.2,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,8,power_law_1.2,0.06540799736976624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,8,power_law_1.2,0.07049599885940552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,8,power_law_1.2,0.07303040027618408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,8,power_law_1.2,0.07402240037918091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,8,power_law_1.2,0.08123520016670227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,balanced,1.8295733133951824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,8,power_law_1.2,0.08429440259933471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,8,power_law_1.2,0.09345920085906982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,8,power_law_1.2,0.10060160160064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,8,power_law_1.2,0.11651840209960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,8,power_law_1.2,0.13500800132751464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,8,power_law_1.2,0.1665984034538269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,8,power_law_1.2,0.23594241142272948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,8,power_law_1.2,0.2896320104598999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,8,power_law_1.2,0.4036287784576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,8,power_law_1.2,0.554969596862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,8,power_law_1.2,0.9104191780090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,8,power_law_1.2,1.069696044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,8,power_law_1.2,1.2698176383972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,8,power_law_1.2,2.5319168090820314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,8,power_law_1.2,4.949728012084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,balanced,0.03585066646337509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,balanced,0.03888533264398575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,balanced,0.0432533323764801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,balanced,0.058176000912984215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,8,power_law_1.2,0.03937920033931732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,balanced,0.07995200157165527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,8,power_law_1.2,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,balanced,0.0811466674009959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,8,power_law_1.2,0.033907198905944826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,balanced,0.08131200075149536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,8,power_law_1.2,0.039238399267196654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,balanced,0.08237333099047343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,8,power_law_1.2,0.04681600034236908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,balanced,0.08255999783674876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,8,power_law_1.2,0.05820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,balanced,0.0825973351796468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,8,power_law_1.2,0.05857920050621033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,balanced,0.08540266752243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,balanced,3.6169811884562173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,balanced,0.08592533071835835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,8,power_law_1.2,0.06120319962501526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,balanced,0.08678399523099263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,8,power_law_1.2,0.06261119842529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,8,power_law_1.2,0.06268159747123718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,balanced,0.09008000294367473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,8,power_law_1.2,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,balanced,0.09666666388511658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,8,power_law_1.2,0.07259520292282104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,balanced,0.10008533795674641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,8,power_law_1.2,0.07393919825553893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,balanced,0.1092639962832133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,8,power_law_1.2,0.08090239763259888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,balanced,0.11988266309102376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,balanced,0.12457066774368286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,8,power_law_1.2,0.08711680173873901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,8,power_law_1.2,0.09479680061340331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,balanced,0.14072533448537192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,balanced,0.1604266663392385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,8,power_law_1.2,0.10115200281143188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,8,power_law_1.2,0.13175040483474731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,balanced,0.22030933698018393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,balanced,0.03329599897066752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,8,power_law_1.2,0.1675711989402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,balanced,0.03521066655715307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,balanced,0.03730133424202601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,8,power_law_1.2,0.21303040981292726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,balanced,0.2600746750831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,balanced,0.0470719983180364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,8,power_law_1.2,0.2539968013763428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,balanced,0.06423466900984447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,balanced,0.06610133250554402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,8,power_law_1.2,0.3921792030334473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,balanced,0.06720533470312755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,8,power_law_1.2,0.5323520183563233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,balanced,0.36285332838694256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,balanced,0.0672266681989034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,8,power_law_1.2,0.687391996383667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,balanced,0.06764266888300578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,balanced,0.0683840016523997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,8,power_law_1.2,1.1447999954223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,balanced,0.06804800033569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,8,power_law_1.2,1.5677824020385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,balanced,0.07027733325958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,balanced,0.07177066802978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,balanced,0.45470933119455975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,8,power_law_1.2,2.073388862609863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,balanced,0.07469333211580913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,balanced,0.0828906645377477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,8,power_law_1.2,3.0044479370117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,balanced,0.08323733508586884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,8,power_law_1.2,4.18326416015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,balanced,0.09177600344022115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,balanced,0.10187199711799622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,8,power_law_1.2,9.464128112792968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,balanced,0.03442666679620743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,balanced,0.6642613410949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,balanced,0.10870400071144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,balanced,0.03544000039498011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,balanced,0.03711466739575068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.01,0.041356799006462094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,balanced,0.12826133767763773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,balanced,0.04618666569391886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.01,0.04296959936618805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,balanced,0.06274666885534923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,balanced,0.14757333199183145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,balanced,0.06525866687297821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.01,0.04255360066890716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,balanced,0.06643199920654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.01,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,balanced,0.20593067010243735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,balanced,0.06705600023269653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.01,0.058355200290679934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,balanced,0.06794133285681407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,balanced,0.8232159614562988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,balanced,0.06980800131956737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.01,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,balanced,0.2513226668039958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,balanced,0.07099199791749318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.01,0.07425919771194459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,balanced,0.07402133444945018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,balanced,0.07673599819342296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.01,0.07523840069770812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,balanced,0.0795253316561381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.01,0.08081279993057251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,balanced,0.372869332631429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.01,0.08173440098762512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.01,0.08725759983062745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.01,0.08883839845657349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.01,0.03640320003032684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.01,0.09258880019187928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,balanced,0.09124267101287842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.01,0.03495680093765259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.01,0.7888576030731201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,balanced,1.0326773325602214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,balanced,0.4869439999262492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,balanced,0.09223999579747517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.01,0.03787519931793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.01,0.8001343727111816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.01,0.04414080083370209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.01,0.8023488044738769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.01,0.049132800102233885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.01,0.12527999877929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.01,0.06222079992294312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.01,0.13609600067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.01,0.06242560148239136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.01,0.14531199932098388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.01,0.06566399931907654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.01,0.17938560247421265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.01,0.06752640008926392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,balanced,0.7160586516062418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,balanced,0.1070240040620168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.01,0.20703999996185302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.01,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.01,0.26023039817810056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,balanced,0.12588799993197122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.01,0.07178239822387696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.01,0.29786880016326905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.01,0.07663999795913697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,balanced,0.13407466808954874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.01,0.4217984199523926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.01,0.08097280263900757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.01,0.5447487831115723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.01,0.07926399707794189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.01,0.7948224067687988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.01,0.08807039856910706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.01,1.0334848403930663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.01,0.09641600251197815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.01,0.10585600137710571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,balanced,0.19628800948460898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.01,1.3485440254211425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,balanced,0.922538677851359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.01,0.11712000370025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,balanced,1.4946613311767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.01,2.2739200592041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.01,0.12519680261611937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,balanced,0.23896000782648721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.01,0.15402239561080933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.01,4.104403305053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.01,0.18865280151367186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.01,0.2561216115951538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,balanced,0.35736533006032306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.01,0.2970240116119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,power_law_1.01,0.03793280124664307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.01,0.4370368003845215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.01,0.5502783775329589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,balanced,0.43541868527730304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,power_law_1.01,0.035692799091339114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.01,0.8215359687805176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,power_law_1.01,0.038726401329040525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.01,1.1358976364135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,power_law_1.01,0.04506880044937134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,balanced,1.1563999652862549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.01,1.3722304344177245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,balanced,0.6270773410797119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,power_law_1.01,0.04933759868144989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.01,2.1174144744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,power_law_1.01,0.0627135992050171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,power_law_1.01,0.06462079882621766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.01,4.711500930786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,power_law_1.01,0.06703360080718994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,balanced,0.8123040199279785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,power_law_1.01,0.0700543999671936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,power_law_1.01,0.07349119782447815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,power_law_1.01,0.07674880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,power_law_1.01,0.0810368001461029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,4,power_law_1.2,0.04101119935512543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,power_law_1.01,0.08943359851837158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,4,power_law_1.2,0.042745599150657655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,power_law_1.01,0.09500799775123596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,balanced,1.2017813523610432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,4,power_law_1.2,0.042419201135635375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,4,power_law_1.2,0.05015040040016174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,power_law_1.01,0.10662399530410767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,4,power_law_1.2,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,balanced,1.6795412699381511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,power_law_1.01,0.11619839668273926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,4,power_law_1.2,0.07035520076751708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,4,power_law_1.2,0.07390720248222352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,4,power_law_1.2,0.0800320029258728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,power_law_1.01,0.1268671989440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,balanced,2.9429279963175454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,4,power_law_1.2,0.0812287986278534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,power_law_1.01,0.1541375994682312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,balanced,1.576325257619222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,4,power_law_1.2,0.08348159790039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,power_law_1.01,0.1784127950668335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,4,power_law_1.2,0.08652160167694092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,4,power_law_1.2,0.09131519794464112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,power_law_1.01,0.2582655906677246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,4,power_law_1.2,0.0938368022441864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,power_law_1.01,0.33765759468078616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,4,power_law_1.2,0.7933055877685546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,power_law_1.01,0.4543744087219238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,4,power_law_1.2,0.7967040061950683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,power_law_1.01,0.5434751987457276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,4,power_law_1.2,0.8080448150634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,power_law_1.01,0.79617919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,4,power_law_1.2,0.12784639596939087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,balanced,1.9747999509175618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,power_law_1.01,1.0982399940490724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,4,power_law_1.2,0.14438400268554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,power_law_1.01,1.5691328048706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,4,power_law_1.2,0.16234240531921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,power_law_1.01,1.9704448699951171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,4,power_law_1.2,0.18921600580215453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,power_law_1.01,2.486777687072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,4,power_law_1.2,0.20689918994903564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,4,power_law_1.2,0.29783039093017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,power_law_1.01,4.008703994750976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,4,power_law_1.2,0.3869695901870728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,4,power_law_1.2,0.46727681159973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,power_law_1.01,9.134425354003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,4,power_law_1.2,0.642310380935669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,4,power_law_1.2,0.03644160032272339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,4,power_law_1.2,0.9033920288085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,4,power_law_1.2,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,4,power_law_1.2,0.03702400028705597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,4,power_law_1.2,1.4337727546691894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,balanced,3.3065385818481445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,4,power_law_1.2,0.044064000248909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,balanced,3.1209119160970054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,4,power_law_1.2,1.8223615646362306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,4,power_law_1.2,0.047968000173568726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,4,power_law_1.2,2.8451648712158204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,4,power_law_1.2,0.061401599645614625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,4,power_law_1.2,0.06286079883575439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,4,power_law_1.2,6.124115371704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,4,power_law_1.2,0.06507520079612732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,4,power_law_1.2,0.07154560089111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,4,power_law_1.2,0.07089279890060425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,4,power_law_1.2,0.07518079876899719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,4,power_law_1.2,0.07862399816513062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,4,power_law_1.2,0.0806656002998352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,4,power_law_1.2,0.08166400194168091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,4,power_law_1.2,0.091212797164917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,4,power_law_1.2,0.09345920085906982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,4,power_law_1.2,0.10451200008392333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,4,power_law_1.2,0.12201600074768067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,4,power_law_1.2,0.140556800365448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,4,power_law_1.2,0.16349439620971679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,4,power_law_1.2,0.19425920248031617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,4,power_law_1.2,0.2686912059783936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,4,power_law_1.2,0.32045440673828124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,4,power_law_1.2,0.4648064136505127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,4,power_law_1.2,0.6302015781402588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,4,power_law_1.2,1.009663963317871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,4,power_law_1.2,1.3212287902832032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,4,power_law_1.2,1.665043258666992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,balanced,6.187914530436198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,4,power_law_1.2,2.538355255126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,4,power_law_1.2,5.170790481567383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,4,power_law_1.2,0.0383679986000061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,4,power_law_1.2,0.0378495991230011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,4,power_law_1.2,0.03894400000572205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,balanced,0.036837334434191384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,4,power_law_1.2,0.04625920057296753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,balanced,0.04475200176239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,4,power_law_1.2,0.048281601071357726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,balanced,0.045253331462542214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,4,power_law_1.2,0.06261759996414185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,balanced,0.061808000008265175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,4,power_law_1.2,0.06528000235557556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,balanced,0.09372799595197041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,4,power_law_1.2,0.06703360080718994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,balanced,0.09405866265296936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,balanced,0.0960693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,4,power_law_1.2,0.0695360004901886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,balanced,0.09569600224494934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,4,power_law_1.2,0.07234560251235962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,balanced,0.09692800045013428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,4,power_law_1.2,0.0775871992111206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,balanced,0.09727999567985535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,4,power_law_1.2,0.08196480274200439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,balanced,0.0995306670665741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,4,power_law_1.2,0.09107840061187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,balanced,0.10338133573532104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,4,power_law_1.2,0.0974016010761261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,balanced,0.1050986647605896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,balanced,0.10949866970380147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,4,power_law_1.2,0.11165440082550049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,balanced,0.11607467134793599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,balanced,0.11912533640861511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,4,power_law_1.2,0.11915520429611207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,balanced,0.12913599610328674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,balanced,0.14520532886187235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,4,power_law_1.2,0.12681599855422973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,balanced,0.1581706702709198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,4,power_law_1.2,0.15843839645385743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,balanced,0.034671999514102936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,balanced,0.18552533785502115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,4,power_law_1.2,0.20207359790802001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,balanced,0.03625066578388214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,balanced,0.04038933416207632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,balanced,0.051776001850763954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,balanced,0.21163199345270792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,4,power_law_1.2,0.2650496006011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,balanced,0.07266666491826375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,balanced,0.07574933270613353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,4,power_law_1.2,0.33473279476165774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,balanced,0.0769760012626648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,balanced,0.29893867174784344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,4,power_law_1.2,0.5048960208892822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,balanced,0.07726933558781941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,4,power_law_1.2,0.6108479976654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,balanced,0.07945066690444946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,balanced,0.08066666622956593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,4,power_law_1.2,0.9980607986450195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,balanced,0.08025066554546356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,balanced,0.40566933155059814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,4,power_law_1.2,1.246009635925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,balanced,0.08388266960779826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,balanced,0.08508800466855367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,4,power_law_1.2,1.876095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,balanced,0.08982400099436443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,4,power_law_1.2,2.4460800170898436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,balanced,0.09894399841626485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,balanced,0.6146133343378702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,balanced,0.10237866640090942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,4,power_law_1.2,3.0376768112182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,balanced,0.11520533760388692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,balanced,0.12863999605178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,4,power_law_1.2,5.243577575683593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,balanced,0.14204800128936768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,balanced,0.8145173390706381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,4,power_law_1.2,12.098534393310548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,balanced,0.17308266957600912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,balanced,0.1996799906094869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.01,0.04510720074176788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,balanced,0.28619199991226196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.01,0.04421760141849518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.01,0.04230400025844574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,balanced,1.2121866544087727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,balanced,0.36699732144673664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.01,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.01,0.06399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.01,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,balanced,0.5879040161768595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.01,0.08940799832344055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.01,0.035392001271247864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.01,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.01,0.09366400241851806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.01,0.03535360097885132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.01,0.09459840059280396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,balanced,1.6217494010925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.01,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.01,0.10278400182723998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,balanced,0.7812746365865072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.01,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.01,0.1155135989189148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.01,0.05204480290412903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.01,0.11665279865264892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.01,0.06680960059165955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.01,0.12294399738311768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.01,0.07008000016212464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.01,0.1348031997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.01,0.07292799949645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.01,0.13395839929580688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.01,0.0794431984424591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,balanced,1.1695786317189534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.01,0.13472000360488892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.01,0.08020480275154114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.01,0.17679359912872314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.01,0.0811456024646759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.01,0.20480639934539796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,balanced,2.0291573206583657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.01,0.09208959937095643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.01,0.09685119986534119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.01,0.236678409576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.01,0.09825279712677001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.01,0.27192959785461424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.01,0.10785919427871704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.01,0.3484544038772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.01,0.11285760402679443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.01,0.4421696186065674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,balanced,1.4358720779418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.01,0.12735359668731688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.01,0.6298816204071045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.01,0.14377599954605103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.01,0.16397440433502197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.01,0.7885183811187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.01,0.19562239646911622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.01,1.2303359985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.01,0.25192320346832275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.01,1.831590461730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.01,0.323744010925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,2,power_law_1.2,0.04467200040817261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.01,0.41059198379516604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.01,2.2135488510131838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,2,power_law_1.2,0.04099839925765991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.01,0.5716351985931396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.01,3.3013057708740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,2,power_law_1.2,0.04211199879646301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.01,0.7895103931427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,balanced,1.8011786142985027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,2,power_law_1.2,0.051948797702789304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,balanced,2.8253758748372397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.01,1.2393152236938476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.01,6.819519805908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,2,power_law_1.2,0.061900800466537474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.01,1.6033344268798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,2,power_law_1.2,0.08701440095901489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.01,1.9601215362548827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,2,power_law_1.2,0.09030399918556213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.01,3.3404991149902346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,2,power_law_1.2,0.09033600091934205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,2,power_law_1.2,0.09580159783363343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.01,6.310879898071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,2,power_law_1.2,0.09438719749450683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,2,power_law_1.2,0.1028607964515686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,2,power_law_1.2,0.11255680322647095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,2,power_law_1.2,0.12301440238952636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,2,power_law_1.2,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,2,power_law_1.2,0.13296639919281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,balanced,2.8234294255574546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,2,power_law_1.2,0.14101120233535766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,2,power_law_1.2,0.14481279850006104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,2,power_law_1.2,0.18487679958343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,2,power_law_1.2,0.21232640743255615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,2,power_law_1.2,0.23372159004211426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,2,power_law_1.2,0.2739264011383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,2,power_law_1.2,0.3532991886138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,2,power_law_1.2,0.4642240047454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,2,power_law_1.2,0.6404287815093994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,2,power_law_1.2,0.8818559646606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,2,power_law_1.2,1.2759552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,2,power_law_1.2,1.9122175216674804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,2,power_law_1.2,2.3471168518066405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,balanced,5.665274937947591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,2,power_law_1.2,3.7611457824707033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,2,power_law_1.2,7.334912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,balanced,5.63047981262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,2,power_law_1.2,0.03553920090198517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,2,power_law_1.2,0.03530240058898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,2,power_law_1.2,0.037964800000190736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,2,power_law_1.2,0.046003198623657225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,2,power_law_1.2,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,2,power_law_1.2,0.06846719980239868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,2,power_law_1.2,0.07091839909553528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,2,power_law_1.2,0.07771520018577575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,2,power_law_1.2,0.08085119724273682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,2,power_law_1.2,0.08429440259933471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,2,power_law_1.2,0.08523520231246948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,2,power_law_1.2,0.0945472002029419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,2,power_law_1.2,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,2,power_law_1.2,0.09937279820442199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,2,power_law_1.2,0.10830080509185791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,2,power_law_1.2,0.11436159610748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,2,power_law_1.2,0.1272704005241394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,2,power_law_1.2,0.14647040367126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,2,power_law_1.2,0.16676479578018188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,2,power_law_1.2,0.2041152000427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,2,power_law_1.2,0.2560447931289673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,2,power_law_1.2,0.3347584009170532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,2,power_law_1.2,0.4464896202087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,2,power_law_1.2,0.6264448165893555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,2,power_law_1.2,0.8575360298156738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,2,power_law_1.2,1.3279232025146483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,2,power_law_1.2,1.7320703506469726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,2,power_law_1.2,2.1231231689453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,2,power_law_1.2,3.846227264404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,2,power_law_1.2,6.874470520019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,balanced,0.039546666045983635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,balanced,0.04925866425037384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,balanced,0.05665066838264465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,balanced,0.0758240024248759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,balanced,0.10631466905275981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,balanced,0.11401066184043884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,balanced,0.11591466267903645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,balanced,0.11584533254305522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,balanced,0.11838933825492859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,balanced,0.1202186644077301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,balanced,0.037445334096749626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,balanced,0.12408533692359924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,balanced,0.045370668172836304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,balanced,0.12777066230773926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,balanced,0.049600000182787575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,balanced,0.1311840017636617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,balanced,0.06835199892520905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,balanced,0.1344266633192698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,balanced,0.09852799773216248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,balanced,0.10193600257237752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,balanced,0.14134933551152548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,balanced,0.10243200262387593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,balanced,0.14730667074521384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,balanced,0.10414933164914449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,balanced,0.16879467169443765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,balanced,0.10758933424949646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,balanced,0.20302400986353555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,balanced,0.10771200060844421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,balanced,0.1102133293946584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,balanced,0.21595199902852377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,balanced,0.1134986678759257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,balanced,0.11716266473134358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,balanced,0.26554665962855023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,balanced,0.1264533301194509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,balanced,0.13710932930310568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.03743999898433685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,balanced,0.3051519989967346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,balanced,0.1457919975121816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,balanced,0.1702186663945516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.039647999405860904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,balanced,0.20202134052912393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.05059840083122254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,balanced,0.4720160166422526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,balanced,0.2163146734237671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.07155200242996215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,balanced,0.27155200640360516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.10172159671783447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,balanced,0.5890133380889893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.10552959442138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.01,0.03566080033779144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,balanced,0.31973334153493244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.11137919425964356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.01,0.039238399267196654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.11759359836578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,balanced,0.4736959934234619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,balanced,0.9688159624735514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.12357759475708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.01,0.05880320072174072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.01,0.06459519863128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.13426560163497925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,balanced,0.6038506825764974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.01,0.08899840116500854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.01,0.0943231999874115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.13831679821014403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.01,0.09683840274810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.13590400218963622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,balanced,1.3145546913146973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.01,0.09995520114898682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,balanced,0.9886240164438883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.14810240268707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.01,0.10378880500793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.01,0.11752320528030395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.15815680027008056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.01,0.12403839826583862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.17530239820480348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.01,0.130457603931427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.22922239303588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,balanced,1.3632747332255046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.01,0.13587839603424073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.23196799755096437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,balanced,1.9737013181050618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.01,0.15219199657440186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.3083712100982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.01,0.1634112000465393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.3603584051132202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.01,0.18644479513168336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.4759552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.01,0.22144639492034912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.6155648231506348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.01,0.2445120096206665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,balanced,2.1009546915690103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.9008576393127441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.01,0.3075200080871582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.01,1.2002047538757323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.01,0.37650558948516843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.01,1.8286783218383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,balanced,2.421610673268636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.01,0.5147327899932861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.01,2.3549503326416015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.01,0.6390592098236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.01,2.9547391891479493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.01,0.9360575675964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.01,1.2668224334716798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.01,5.085548782348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.01,1.9676223754882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,balanced,2.7957547505696616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.01,2.6588544845581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.01,10.11599349975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.01,3.372639846801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.01,5.31673583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,balanced,3.0372746785481772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.01,10.824492645263671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,balanced,3.5252691904703775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.04010240137577057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,1,power_law_1.2,0.03575679957866669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.04618239998817444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,balanced,4.775850613911946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,1,power_law_1.2,0.03988479971885681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.06053119897842407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,1,power_law_1.2,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.06904320120811462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,1,power_law_1.2,0.05440000295639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.10121599435806275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,1,power_law_1.2,0.06096000075340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.10716160535812377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,1,power_law_1.2,0.08963199853897094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.1093567967414856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,balanced,5.137605349222819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,1,power_law_1.2,0.0979200005531311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.11597440242767335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,1,power_law_1.2,0.09978240132331848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.12454400062561036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,1,power_law_1.2,0.10266879796981812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.12910079956054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,1,power_law_1.2,0.10751359462738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.14014079570770263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,1,power_law_1.2,0.1199679970741272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.1447424054145813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,1,power_law_1.2,0.12553600072860718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.1379263997077942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,1,power_law_1.2,0.13215999603271483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.15058560371398927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,1,power_law_1.2,0.13797119855880738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.1594879984855652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,1,power_law_1.2,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.17994879484176635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.23593599796295167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,1,power_law_1.2,0.16605440378189087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,1,power_law_1.2,0.1886016011238098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.23957760334014894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,1,power_law_1.2,0.22456960678100585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.31166079044342043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,1,power_law_1.2,0.24783360958099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.3716543912887573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,1,power_law_1.2,0.30840320587158204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.48479361534118653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,1,power_law_1.2,0.3799295902252197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.6261951923370361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,1,power_law_1.2,0.5168191909790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.920025634765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,1,power_law_1.2,0.6439104080200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,1,power_law_1.2,1.2407296180725098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,1,power_law_1.2,0.9534463882446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,1,power_law_1.2,1.8868864059448243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,1,power_law_1.2,1.3019264221191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,1,power_law_1.2,2.467046356201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,1,power_law_1.2,1.9764991760253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,1,power_law_1.2,3.166169548034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,balanced,9.914021174112955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,1,power_law_1.2,2.692697525024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,1,power_law_1.2,5.109478378295899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,1,power_law_1.2,3.3809024810791017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,1,power_law_1.2,5.326988983154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,1,power_law_1.2,10.14967041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,balanced,10.330421447753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,1,power_law_1.2,10.774969482421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,balanced,0.08451199531555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,balanced,0.0766133318344752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,balanced,0.07604800164699554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,balanced,0.10653866330782573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,balanced,0.1625866691271464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,balanced,0.20064000288645426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,balanced,0.05685866872469584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,balanced,0.20284799734751383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,balanced,0.05700799822807312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,balanced,0.20014933745066324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,balanced,0.07849066456158955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,balanced,0.19926400979359946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,balanced,0.11241066455841064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,balanced,0.2006453275680542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,balanced,0.12593600153923035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,balanced,0.20132267475128174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,balanced,0.12800533572832742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,balanced,0.20248534282048544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,balanced,0.12801600495974222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,balanced,0.20383999745051065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,balanced,0.1284213364124298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,balanced,0.057189335425694786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,balanced,0.20595733324686685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,balanced,0.13061867157618204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,balanced,0.05451733370621999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,balanced,0.20804266134897867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,balanced,0.13130666812260947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,balanced,0.057349334160486855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,balanced,0.13149333000183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,balanced,0.07981333136558533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,balanced,0.21925866603851318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,balanced,0.11685333649317424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,balanced,0.1341813306013743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,balanced,0.21688000361124674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,balanced,0.12156266967455547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,balanced,0.13582932949066162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,balanced,0.12337600191434224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,balanced,0.26444266239802044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,balanced,0.12358933687210083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,balanced,0.14164800445238748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,balanced,0.12379200259844463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,balanced,0.14301333824793497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,balanced,0.2334293325742086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,balanced,0.12450133760770161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,balanced,0.14776000380516052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,balanced,0.12610133488972983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,balanced,0.28178133567174274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,balanced,0.12709333499272665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,balanced,0.16915732622146606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,balanced,0.1291146675745646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,balanced,0.26764265696207684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,balanced,0.1681600014368693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,balanced,0.13099732995033264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,balanced,0.13614400227864584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,balanced,0.20042665799458823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,balanced,0.37646400928497314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,balanced,0.20570667584737143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,balanced,0.3301546573638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,balanced,0.2678613265355428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,balanced,0.137882669766744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,balanced,0.5173813501993815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,balanced,0.28384532531102497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,balanced,0.14323733250300089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,balanced,0.42138667901357013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,balanced,0.5562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,balanced,0.47226667404174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,balanced,0.15338666240374246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,balanced,0.1627840002377828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,balanced,0.6898880004882812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,balanced,0.6806613604227701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,balanced,0.1816320021947225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,balanced,0.9186506271362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,balanced,0.19798932472864786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.20426878929138184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.18332159519195557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,balanced,0.26012800137201947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.1322368025779724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.11900800466537476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,balanced,0.8492213090260824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.20252161026000975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.11783679723739623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.11669119596481323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.10633599758148193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.08271999955177307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,balanced,0.2903306682904561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.14730240106582643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.11934720277786255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.10060160160064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,power_law_1.01,0.12302720546722412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.18167680501937866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.10712319612503052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.12880640029907225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.18689279556274413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.1218176007270813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.15292160511016845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,power_law_1.01,0.10747519731521607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.11829760074615478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.19212160110473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,balanced,1.079802672068278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.17593599557876588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,power_law_1.01,0.07339519858360291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.1272063970565796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.18607360124588013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,power_law_1.01,0.09566079974174499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.11958400011062623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.17825920581817628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.19877760410308837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,balanced,0.3942986726760864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.1317055940628052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,power_law_1.01,0.10551680326461792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.19009920358657836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.2032639980316162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.1229632019996643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,balanced,0.999013344446818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,power_law_1.01,0.11969920396804809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.19901440143585206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.2274240016937256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.1373247981071472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.22164480686187743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,power_law_1.01,0.11907199621200562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.22779519557952882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.14303359985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.23677439689636232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.13916800022125245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.24180479049682618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,power_law_1.01,0.11994240283966065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,1,32,power_law_1.2,0.12600959539413453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.15349760055541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.2717184066772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.24584319591522216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,power_law_1.01,0.12337280511856079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.1593791961669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.2798912048339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.24272639751434327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,1,32,power_law_1.2,0.0717248022556305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,power_law_1.01,0.1318336009979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.18094719648361207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,balanced,0.5331999858220419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.28247039318084716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.2863935947418213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,1,32,power_law_1.2,0.0805184006690979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.21226880550384522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,power_law_1.01,0.13934719562530518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.01,0.42170238494873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.3037823915481567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.22469120025634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,1,32,power_law_1.2,0.09534720182418824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,power_law_1.01,0.14009599685668944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.33660159111022947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.33552000522613523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.27638399600982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,power_law_1.01,0.13625600337982177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,1,32,power_law_1.2,0.09599999785423279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,1,32,power_law_1.2,0.47438721656799315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.01,0.43123202323913573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.29910399913787844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,power_law_1.01,0.17039999961853028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,1,32,power_law_1.2,0.3966016054153442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,1,32,power_law_1.2,0.11829760074615478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,balanced,1.596410592397054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.01,0.5019455909729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,0.4084159851074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,1,32,power_law_1.2,0.5047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,1,32,power_law_1.2,0.12501120567321777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,power_law_1.01,0.1753216028213501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.01,0.5678912162780761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,balanced,0.7330026626586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,0.45946240425109863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,1,32,power_law_1.2,0.506924819946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,1,32,power_law_1.2,0.1289791941642761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.01,0.6336512088775634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,0.7144256114959717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,1,32,power_law_1.2,0.7040512084960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,1,32,power_law_1.2,0.1306496024131775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.01,0.9131967544555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,power_law_1.01,0.17741440534591674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,1,32,power_law_1.2,0.1266495943069458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,0.8196991920471192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,1,32,power_law_1.2,0.8796928405761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,balanced,1.5185813903808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.01,1.0804224014282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,1,32,power_law_1.2,0.13771519660949708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,1,32,power_law_1.2,1.0728896141052247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,1.3628352165222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.01,1.5926783561706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,1,32,power_law_1.2,0.14705920219421387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,1,32,power_law_1.2,1.637606430053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,1.5210495948791505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,power_law_1.01,0.18264319896697997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.01,2.278483200073242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,1,32,power_law_1.2,0.15304960012435914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,1,32,power_law_1.2,2.6234176635742186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,1,32,power_law_1.2,0.15245440006256103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.01,2.0359935760498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.01,2.718931198120117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,1,32,power_law_1.2,0.17007360458374024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,balanced,0.9843733310699463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,1,32,power_law_1.2,3.058745574951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.01,3.2368831634521484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,power_law_1.01,0.21276159286499025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.01,5.234809494018554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,1,32,power_law_1.2,0.16876159906387328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,1,32,power_law_1.2,5.251091384887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,1,32,power_law_1.2,0.20088319778442382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.01,0.2560256004333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.01,6.233958435058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,1,32,power_law_1.2,0.2600255966186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.01,7.75006103515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,1,32,power_law_1.2,7.826668548583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,1,32,power_law_1.2,0.2580159902572632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,1,32,power_law_1.2,0.32885758876800536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.01,0.29241600036621096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,power_law_1.2,15.765037536621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,1,32,power_law_1.2,0.3562304019927979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.01,0.36981759071350095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,1,32,power_law_1.2,0.4955584049224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.01,0.4607423782348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,1,32,power_law_1.2,0.5539584159851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.01,0.7394752025604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,balanced,1.194421370824178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,1,32,power_law_1.2,0.8119935989379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.01,0.9687552452087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,1,32,power_law_1.2,1.1442815780639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.01,1.349561595916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,1,32,power_law_1.2,1.9
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.01,1.9262527465820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,1,32,power_law_1.2,2.651315116882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,1,32,power_law_1.2,2.910438346862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.01,2.9450048446655273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,1,32,balanced,3.1954825719197593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,power_law_1.01,3.0945600509643554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,1,32,power_law_1.2,6.849785614013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,power_law_1.01,4.922118377685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,power_law_1.2,11.376179504394532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,1,32,balanced,2.940890630086263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,power_law_1.01,9.517721557617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,balanced,1.884885311126709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,balanced,3.7645492553710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,1,32,power_law_1.2,0.11720960140228272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,1,32,power_law_1.2,0.07036160230636597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,1,32,power_law_1.2,0.07351040244102477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,1,32,power_law_1.2,0.09185919761657715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,balanced,0.0714026689529419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,1,32,power_law_1.2,0.101363205909729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,balanced,0.05784533421198527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,balanced,0.06898133456707001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,1,32,power_law_1.2,0.10832639932632446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,balanced,0.053264002005259194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,balanced,0.07167466481526692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,1,32,power_law_1.2,0.1162559986114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,balanced,0.059546664357185364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,balanced,0.10754666725794475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,1,32,power_law_1.2,0.12753280401229858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,balanced,0.07871999839941661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,balanced,0.16160000363985697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,balanced,0.11308800180753072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,balanced,0.19510400295257568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,1,32,power_law_1.2,0.12776960134506227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,balanced,0.12633599837621054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,balanced,0.20247467358907065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,1,32,power_law_1.2,0.12688640356063843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,balanced,0.1966879963874817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,balanced,0.1285706659158071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,1,32,power_law_1.2,0.13431040048599244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,balanced,0.19637866814931235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,balanced,0.12846933801968893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,1,32,power_law_1.2,0.13924479484558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,balanced,0.1975626746813456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,balanced,0.12935466567675272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,1,32,power_law_1.2,0.15279359817504884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,balanced,0.13019733627637228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,balanced,0.19821866353352866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,1,32,power_law_1.2,0.17106560468673707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,balanced,0.1322719951470693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,balanced,0.19911466042200723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,1,32,power_law_1.2,0.1837056040763855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,balanced,0.13265599807103476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,balanced,0.2008799910545349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,balanced,0.13477333386739096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,balanced,0.20306134223937988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,balanced,0.13632532954216003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,balanced,0.20764267444610596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,1,32,power_law_1.2,0.18782080411911012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,balanced,0.14326399564743042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,balanced,0.21529066562652588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,balanced,0.1449066698551178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,balanced,0.21944532791773477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,1,32,power_law_1.2,0.22998399734497071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,balanced,0.15004799763361612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,balanced,0.2568853298823039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.01,0.11889280080795288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.01,0.17674880027770995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,balanced,0.17357865969340006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,balanced,0.2366186579068502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.01,0.10461440086364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,1,32,power_law_1.2,0.23164160251617433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.01,0.1964416027069092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,balanced,0.17426133155822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.01,0.0685375988483429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,balanced,0.291701336701711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.2,0.2912512063980103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.01,0.08440960049629212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.01,0.08999680280685425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,balanced,0.2104853391647339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.01,0.09186559915542603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,balanced,0.27403199672698975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.01,0.11735039949417114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.01,0.11478400230407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.01,0.12014720439910889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.01,0.12466559410095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,balanced,0.2188160022099813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.2,0.339136004447937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.01,0.12491519451141357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,balanced,0.3642666737238566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.01,0.16174720525741576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,balanced,0.04497600098450979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,power_law_1.01,0.11259520053863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.01,0.1214143991470337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.2,0.4302527904510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.01,0.18862719535827638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.01,0.12486399412155151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,balanced,0.2852746645609538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,balanced,0.04548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.2,0.5537919998168945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,power_law_1.01,0.10296319723129273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.01,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.01,0.17827839851379396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,balanced,0.34772801399230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,balanced,0.056885331869125366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.01,0.1288831949234009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.2,0.78056321144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.01,0.182259202003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.01,0.13627519607543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,balanced,0.07449600100517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,power_law_1.01,0.08132479786872863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,balanced,0.30726399024327594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.01,0.13602559566497802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,balanced,0.11628799637158711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.01,0.19148800373077393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.2,1.1975744247436524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.01,0.14421759843826293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,power_law_1.01,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,balanced,0.12129599849383037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.01,0.15399680137634278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,balanced,0.5352160135904948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.01,0.19425920248031617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,power_law_1.01,0.11308159828186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,balanced,0.12304533521334331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.01,0.17128959894180298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.2,1.953753662109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,power_law_1.01,0.11808639764785767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,balanced,0.12349866827329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.01,0.20149760246276854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,balanced,0.4490453402201335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.01,0.20842878818511962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,balanced,0.12407466769218445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.01,0.21420800685882568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,power_law_1.01,0.12524160146713256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.2,2.611174392700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.01,0.2630784034729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,balanced,0.12583999832471213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.01,0.19992320537567138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,power_law_1.01,0.12300800085067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,balanced,0.5918613274892172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.01,0.2650048017501831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.2,4.486201477050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,balanced,0.1274720033009847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,power_law_1.01,0.12718080282211303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.01,0.2106175899505615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.01,0.37407360076904295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,balanced,0.1276479959487915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,power_law_1.01,0.13165440559387206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,1,32,power_law_1.2,5.27325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.01,0.4234816074371338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,balanced,0.5441973209381104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.01,0.21806080341339112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,balanced,0.13019733627637228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,power_law_1.01,0.1428096055984497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.01,0.5746880054473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,balanced,0.13236266374588013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.01,0.24044160842895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.01,0.765772819519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,power_law_1.01,0.14730240106582643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,1,32,power_law_1.2,9.814476776123048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,balanced,0.13914133111635843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.01,0.2644479990005493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.01,1.1016511917114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,power_law_1.01,0.15868159532546997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,balanced,0.721781333287557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.01,0.347052788734436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.01,1.3644224166870118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,power_law_1.01,0.1673472046852112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,1,32,power_law_1.2,16.387692260742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,16,power_law_1.2,0.17575039863586425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.01,0.2877568006515503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.01,1.9406976699829102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.01,0.38883841037750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,balanced,0.7039306958516439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,16,power_law_1.2,0.11701120138168335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.01,3.0474048614501954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,balanced,0.14103999733924866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,power_law_1.01,0.16807680130004882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,16,power_law_1.2,0.0966592013835907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.01,0.3826495885848999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,16,power_law_1.2,0.11126400232315063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.01,5.59288330078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.01,0.48869757652282714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,16,power_law_1.2,0.11904640197753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,16,power_law_1.2,0.15546239614486695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.01,0.5850175857543946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,16,power_law_1.2,0.17738239765167235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,balanced,0.9356586933135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.01,0.7685184001922607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,16,power_law_1.2,0.17813119888305665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,power_law_1.01,0.18161280155181886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,balanced,0.14784533778826395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,16,power_law_1.2,0.1887935996055603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.01,0.9513407707214355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,16,power_law_1.2,0.18844799995422362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,balanced,0.9307786623636881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.01,1.4501376152038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,16,power_law_1.2,0.18963840007781982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,16,power_law_1.2,0.20008320808410646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.01,1.83239688873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,16,power_law_1.2,0.21048319339752197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.01,2.1252479553222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,16,power_law_1.2,0.2074944019317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.01,3.909747314453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,power_law_1.01,0.20814719200134277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,16,power_law_1.2,0.22124159336090088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,balanced,0.16081066926320395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,power_law_1.01,0.24702720642089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,16,power_law_1.2,0.23244800567626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,balanced,1.0993813673655193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,balanced,0.1727893352508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.01,7.596173095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,16,power_law_1.2,0.2667327880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,16,power_law_1.2,0.32794239521026614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,16,power_law_1.2,0.32094080448150636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,balanced,1.1190880139668782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,16,power_law_1.2,0.45326719284057615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,16,power_law_1.2,0.42872958183288573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,16,power_law_1.2,0.5950911998748779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,16,power_law_1.2,0.6655424118041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,power_law_1.01,0.2794303894042969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,balanced,0.1982240080833435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,16,power_law_1.2,0.9464768409729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,power_law_1.01,0.3717119932174683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,16,power_law_1.2,1.4322367668151856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,balanced,0.21965867280960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,power_law_1.01,0.479315185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,16,power_law_1.2,1.6619840621948243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,power_law_1.01,0.5920703887939454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,16,power_law_1.2,2.7453439712524412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,balanced,0.3006346623102824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,16,power_law_1.2,3.1092927932739256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,power_law_1.2,4.721702575683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,balanced,0.3582133452097575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,power_law_1.01,0.8870207786560058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,16,balanced,1.727728048960368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,power_law_1.2,11.044684600830077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,power_law_1.01,1.195199966430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,balanced,1.6930239995320637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,balanced,0.49872533480326336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,power_law_1.01,1.7808000564575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,power_law_1.01,2.3418048858642577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,power_law_1.01,2.85361270904541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,balanced,0.6334559917449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,power_law_1.01,4.671129608154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,power_law_1.01,9.235276794433593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,balanced,0.8890079657236735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,balanced,1.1852800051371257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,16,balanced,3.247333208719889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,balanced,3.2793652216593423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,balanced,1.4458506902058919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,balanced,2.2870613733927407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,16,power_law_1.2,0.11654399633407593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,16,power_law_1.2,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,16,power_law_1.2,0.06954240202903747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,16,power_law_1.2,0.07724159955978394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,16,power_law_1.2,0.08579199910163879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,16,power_law_1.2,0.11571840047836304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,16,power_law_1.2,0.11832959651947021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,16,power_law_1.2,0.1255552053451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,16,power_law_1.2,0.12010879516601562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,16,power_law_1.2,0.12573440074920655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,16,power_law_1.2,0.129203200340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,16,power_law_1.2,0.13123199939727784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,16,power_law_1.2,0.13852159976959227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,16,power_law_1.2,0.11304320096969604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,16,power_law_1.2,0.1417407989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,16,power_law_1.2,0.06814079880714416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,16,power_law_1.2,0.15441919565200807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,16,power_law_1.2,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,16,power_law_1.2,0.16104960441589355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,16,power_law_1.2,0.0791487991809845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,16,power_law_1.2,0.18478720188140868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,16,power_law_1.2,0.08862720131874084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,16,power_law_1.2,0.21923840045928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,16,power_law_1.2,0.11467519998550416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,16,power_law_1.2,0.2335103988647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,16,power_law_1.2,0.29887359142303466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,16,power_law_1.2,0.11797120571136474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,16,power_law_1.2,0.3066431999206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,16,power_law_1.2,0.12355200052261353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,16,power_law_1.2,0.4345344066619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,16,power_law_1.2,0.12438399791717529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,16,power_law_1.2,0.5419904232025147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,16,power_law_1.2,0.12722560167312622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,16,power_law_1.2,0.6692351818084716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,16,power_law_1.2,0.12691199779510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,16,power_law_1.2,0.8298239707946777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,16,power_law_1.2,0.14108799695968627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,16,power_law_1.2,1.2871744155883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,16,power_law_1.2,0.1435263991355896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,16,power_law_1.2,0.1573184013366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,16,power_law_1.2,2.101055908203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,16,power_law_1.2,0.17935359477996826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,balanced,4.542943954467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,16,power_law_1.2,2.460153579711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,balanced,0.05797333518664042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,16,power_law_1.2,3.6976577758789064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,16,power_law_1.2,0.17763839960098265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,balanced,0.059578667084376015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,balanced,0.07131733496983846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,16,power_law_1.2,7.182125091552734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,balanced,0.10734933614730835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,16,power_law_1.2,0.191046404838562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,balanced,0.17766932646433511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,balanced,0.19613333543141684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,balanced,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,balanced,0.2037866711616516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,balanced,0.19912532965342203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,16,power_law_1.2,0.23405439853668214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,balanced,0.19845332702000937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,balanced,0.056549335519472756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,16,power_law_1.2,0.26831998825073244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,balanced,0.20084265867869058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,balanced,0.07732800145943959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,balanced,0.11306666334470113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,balanced,0.20137600104014078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,balanced,0.2027733325958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,balanced,0.12640532851219177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,16,power_law_1.2,0.3509567975997925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,balanced,0.129120002190272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,balanced,0.2032853364944458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,16,power_law_1.2,0.3909440040588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,balanced,0.13006933530171713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,balanced,0.20689600706100464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,16,power_law_1.2,0.6857984066009521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,balanced,0.13064000010490417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,balanced,0.21239999930063883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,balanced,0.1329866647720337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,16,power_law_1.2,0.7449408054351807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,balanced,0.21942933400472006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,balanced,0.13505599896113077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,balanced,0.228767991065979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,balanced,0.13395733634630838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,16,power_law_1.2,1.0707136154174806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,balanced,0.26808534065882367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,balanced,0.13709333539009094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,balanced,0.2515786687533061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,balanced,0.13904533783594766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,16,power_law_1.2,1.5718655586242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,balanced,0.04498666524887085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,balanced,0.14687466621398926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,balanced,0.3195573290189107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,16,power_law_1.2,2.0983871459960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,balanced,0.046575998266537987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,balanced,0.14984533190727234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,balanced,0.05667733152707418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,balanced,0.29976000388463336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,balanced,0.15633066495259604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,16,power_law_1.2,2.787059211730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,balanced,0.08069866895675659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,balanced,0.18388799826304117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,16,power_law_1.2,4.129062271118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,balanced,0.11657599608103435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,balanced,0.3843413194020589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,balanced,0.12380266189575195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,balanced,0.18444265921910605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,balanced,0.12628799676895142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,16,power_law_1.2,6.98076171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,balanced,0.2311413288116455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,balanced,0.12732799847920737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,balanced,0.40139198303222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,balanced,0.12850667039553323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,balanced,0.2414720058441162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,16,power_law_1.2,15.317433166503907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,balanced,0.12995733817418417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,balanced,0.1320799986521403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,balanced,0.5981493393580118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,balanced,0.13336533308029175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,balanced,0.31189332405726117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,balanced,0.13660266995429993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,balanced,0.14057067036628723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,balanced,0.358240008354187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,balanced,0.14777066310246786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,balanced,0.6866453488667806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.01,0.07693439722061157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.01,0.11117440462112427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,balanced,0.5154773394266764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.01,0.08575360178947448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.01,0.11466879844665527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,balanced,0.15120533108711243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.01,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.01,0.07351040244102477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.01,0.0818943977355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.01,0.10773760080337524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.01,0.08590720295906067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,balanced,0.838752031326294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,balanced,0.6160533428192139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.01,0.11632640361785888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.01,0.10584319829940796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.01,0.11852799654006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.01,0.16636799573898314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,balanced,0.16195733348528543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.01,0.12113280296325683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.01,0.1749567985534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.01,0.1256832003593445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.01,0.12225919961929321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.01,0.18422399759292601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.01,0.12929919958114625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.01,0.17610880136489868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.01,0.13067519664764404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,balanced,0.8318719863891602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.01,0.1881600022315979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.01,0.1375872015953064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,balanced,1.134335994720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.01,0.19095040559768678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.01,0.1411520004272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,balanced,0.1821440060933431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.01,0.1523200035095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.01,0.19541120529174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,balanced,0.19689067204793295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.01,0.1563199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.01,0.19757440090179443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.01,0.1611199975013733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.01,0.2113408088684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.01,0.19540480375289918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.01,0.22220799922943116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.01,0.200927996635437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.01,0.23807361125946044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.01,0.2509567975997925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,balanced,1.0876266956329346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.01,0.23728640079498292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.01,0.28784639835357667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,balanced,0.23868799209594727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.01,0.38782079219818116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.01,0.2891135931015015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.01,0.42371201515197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.01,0.27752320766448973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,balanced,1.3180373509724934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,balanced,0.28521066904067993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.01,0.6208960056304932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.01,0.3458240032196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.01,0.7315968036651611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.01,0.3821887969970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.01,1.0769408226013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,balanced,0.41336532433827716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.01,0.4674816131591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.01,1.5707839965820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.01,0.5092991828918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.01,1.6716032028198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.01,0.7396736145019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,balanced,0.48957868417104083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.01,0.8995840072631835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.01,2.855551910400391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,balanced,1.3046826521555583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.01,1.381708812713623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.01,5.692287826538086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.01,1.598585605621338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.01,2.0114112854003907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.01,3.282662582397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,balanced,0.6850559711456299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.01,5.800505447387695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,balanced,2.0723093350728354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,balanced,0.897594690322876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,power_law_1.01,0.07678080201148987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,balanced,2.0347839991251626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,power_law_1.01,0.08872960209846496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,power_law_1.01,0.06113920211791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,balanced,1.2466826438903809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,power_law_1.01,0.07762560248374939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,power_law_1.01,0.08496639728546143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,8,power_law_1.2,0.11160320043563843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,power_law_1.01,0.1130560040473938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,8,power_law_1.2,0.07523199915885925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,power_law_1.01,0.11781760454177856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,8,power_law_1.2,0.08087679743766785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,8,power_law_1.2,0.10708479881286621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,power_law_1.01,0.11905280351638795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,8,power_law_1.2,0.10815999507904053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,power_law_1.01,0.12518399953842163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,8,power_law_1.2,0.16864000558853148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,balanced,1.6625547409057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,power_law_1.01,0.12676479816436767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,8,power_law_1.2,0.17580800056457518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,8,power_law_1.2,0.18316160440444945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,power_law_1.01,0.13597439527511596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,8,power_law_1.2,0.17285759449005128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,power_law_1.01,0.1366528034210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,8,power_law_1.2,0.1948032021522522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,power_law_1.01,0.14855680465698243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,8,power_law_1.2,0.19990400075912476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,power_law_1.01,0.1567296028137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,8,power_law_1.2,0.1996608018875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,power_law_1.01,0.18234879970550538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,8,power_law_1.2,0.20536320209503173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,8,power_law_1.2,0.20846080780029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,8,power_law_1.2,0.22120320796966553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,power_law_1.01,0.1801408052444458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,balanced,2.0353973706563315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,8,power_law_1.2,0.2298111915588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,8,power_law_1.2,0.26413440704345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,8,power_law_1.2,0.3166975975036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,power_law_1.01,0.18719359636306762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,8,power_law_1.2,0.3080895900726318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,8,power_law_1.2,0.3771967887878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,balanced,3.9844481150309243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,8,power_law_1.2,0.4393727779388428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,power_law_1.01,0.21738879680633544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,8,power_law_1.2,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,power_law_1.01,0.2563647985458374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,8,power_law_1.2,0.6149759769439698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,balanced,4.00544548034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,8,power_law_1.2,0.07719039916992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,8,power_law_1.2,0.8476736068725585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,8,power_law_1.2,0.06376320123672485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,8,power_law_1.2,1.1144319534301759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,power_law_1.01,0.3281856060028076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,8,power_law_1.2,0.059059202671051025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,power_law_1.01,0.41634559631347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,8,power_law_1.2,1.6438848495483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,8,power_law_1.2,0.06622080206871032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,power_law_1.01,0.5878464221954346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,8,power_law_1.2,0.08046720027923585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,8,power_law_1.2,1.8322816848754884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,power_law_1.01,0.6716800212860108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,8,power_law_1.2,0.11419520378112794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,balanced,3.1871840159098306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,8,power_law_1.2,2.3713663101196287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,8,power_law_1.2,0.12119040489196778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,power_law_1.01,1.033459186553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,8,power_law_1.2,0.11768959760665894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,8,power_law_1.2,4.857676696777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,power_law_1.01,1.31845121383667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,8,power_law_1.2,0.12419840097427368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,8,power_law_1.2,0.12499200105667115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,power_law_1.01,2.086809539794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,8,power_law_1.2,7.769676971435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,8,power_law_1.2,0.1294592022895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,power_law_1.01,2.477471923828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,8,power_law_1.2,0.13542399406433106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,power_law_1.01,3.1770751953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,8,power_law_1.2,0.14372479915618896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,8,power_law_1.2,0.1432703971862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,power_law_1.01,4.733388900756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,8,power_law_1.2,0.1520640015602112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,8,power_law_1.2,0.15740159749984742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,power_law_1.01,10.715532684326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,8,power_law_1.2,0.16948479413986206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,8,power_law_1.2,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,8,power_law_1.2,0.22021760940551757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,8,power_law_1.2,0.295795202255249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,8,power_law_1.2,0.29103999137878417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,8,power_law_1.2,0.36690559387207033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,8,power_law_1.2,0.48414077758789065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,8,power_law_1.2,0.7519423961639404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,8,power_law_1.2,0.8925888061523437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,8,power_law_1.2,1.3423295974731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,8,power_law_1.2,1.7529024124145507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,8,power_law_1.2,2.1323968887329103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,balanced,6.383663813273112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,8,power_law_1.2,3.6256256103515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,8,power_law_1.2,8.231014251708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,8,power_law_1.2,0.0812608003616333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,8,power_law_1.2,0.062003201246261595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,8,power_law_1.2,0.05441920161247253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,8,power_law_1.2,0.07156479954719544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,balanced,0.05385066568851471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,8,power_law_1.2,0.08650239706039428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,balanced,0.06028800209363302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,8,power_law_1.2,0.11434240341186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,balanced,0.0730453332265218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,8,power_law_1.2,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,balanced,0.10913599530855815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,balanced,0.1653279960155487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,8,power_law_1.2,0.12469120025634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,balanced,0.20172800620396933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,8,power_law_1.2,0.12492799758911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,balanced,0.20433600743611655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,balanced,0.20488532384236655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,8,power_law_1.2,0.1270591974258423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,balanced,0.20586667458216348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,balanced,0.20588266849517822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,8,power_law_1.2,0.13904000520706178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,balanced,0.20553600788116455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,8,power_law_1.2,0.14469759464263915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,balanced,0.20652800798416138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,8,power_law_1.2,0.15235840082168578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,balanced,0.20755734046300253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,8,power_law_1.2,0.1541759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,balanced,0.21286400159200033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,8,power_law_1.2,0.17774080038070678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,balanced,0.22009599208831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,balanced,0.22945600748062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,balanced,0.23572266101837158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,8,power_law_1.2,0.19062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,balanced,0.28514667352040607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,balanced,0.27937066555023193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,8,power_law_1.2,0.19227520227432252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,balanced,0.37603731950124103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,8,power_law_1.2,0.22406399250030518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,balanced,0.3495466709136963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,8,power_law_1.2,0.2679935932159424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,balanced,0.46861334641774494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,8,power_law_1.2,0.33905279636383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,8,power_law_1.2,0.44715518951416017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,balanced,0.49489065011342365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,8,power_law_1.2,0.7228608131408691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,8,power_law_1.2,0.8434432029724122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,8,power_law_1.2,1.1989439964294433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,balanced,0.7437067031860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,8,power_law_1.2,1.8038080215454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,8,power_law_1.2,1.9676223754882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,balanced,0.04825599988301595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,8,power_law_1.2,2.7124095916748048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,balanced,0.05109866460164388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,balanced,0.05819199979305267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,balanced,0.8536213239034017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,8,power_law_1.2,4.677427291870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,balanced,0.08040533463160197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,balanced,0.11863999565442403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,8,power_law_1.2,6.469087982177735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,balanced,0.1313813328742981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,balanced,0.1344533363978068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,balanced,0.13555199901262918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,8,power_law_1.2,15.144525146484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,balanced,0.051125332713127136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,balanced,0.13743467132250467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,balanced,0.13641066352526346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,balanced,0.05471999943256378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,balanced,1.254245360692342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,balanced,0.13937066992123923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,balanced,0.060133333007494606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,balanced,0.14200533429781595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,balanced,0.08152000109354655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,balanced,0.11743467052777608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,balanced,0.14522133270899454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,balanced,0.13395733634630838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,balanced,0.1497706671555837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,balanced,0.13766933480898538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,balanced,0.1581493318080902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,balanced,0.1381493310133616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,balanced,0.1623360017935435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,balanced,0.1395093301932017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,balanced,0.14244266351064047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,balanced,0.17052799463272095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,balanced,1.616085370381673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,balanced,0.14588800072669983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.01,0.07457919716835022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,balanced,0.20799465974171957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,balanced,0.14877866705258688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,balanced,0.15318933129310608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.01,0.08175359964370728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,balanced,0.20851200819015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,balanced,0.1604266663392385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.01,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,balanced,0.17082132895787558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.01,0.10226559638977051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,balanced,0.25737067063649494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.01,0.11637760400772094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.01,0.058739197254180905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.01,0.16313600540161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,balanced,0.28390934069951373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.01,0.16505600214004518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.01,0.06721919775009155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.01,0.1654528021812439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.01,0.05868160128593445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,balanced,0.17997332413991293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.01,0.18224639892578126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,balanced,0.3753066857655843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.01,0.07445120215415954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.01,0.1880959987640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,balanced,1.7824692726135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.01,0.08459519743919372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.01,0.19697279930114747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.01,0.11604479551315308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,balanced,0.44788801670074463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.01,0.20286719799041747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.01,0.12148480415344239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.01,0.20533759593963624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,balanced,0.19404266277949014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.01,0.21747200489044188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.01,0.12344319820404052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.01,0.22004480361938478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.01,0.12208640575408936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,balanced,0.6621760129928589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.01,0.23412480354309081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.01,0.1296447992324829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.01,0.26117119789123533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.01,0.13393280506134034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.01,0.297875189781189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.01,0.14123519659042358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.01,0.31215360164642336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,balanced,0.23137599229812622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.01,0.38700160980224607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.01,0.1502079963684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,balanced,0.8197546799977621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.01,0.41120638847351076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.01,0.14740480184555055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,balanced,0.2733599940935771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.01,0.4933504104614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.01,0.15998719930648803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.01,0.6557504177093506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.01,0.16424959897994995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.01,0.8314751625061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.01,0.20051200389862062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,4,power_law_1.2,0.07489920258522034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,balanced,2.908752123514811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.01,1.0935104370117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.01,0.2145087957382202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,balanced,0.35155200958251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,4,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.01,1.5870016098022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.01,0.22768640518188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,4,power_law_1.2,0.07089920043945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.01,1.9840768814086913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,balanced,1.2025012969970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,balanced,0.42100266615549725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.01,0.29144959449768065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.01,2.2620288848876955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,4,power_law_1.2,0.10194560289382934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,power_law_1.01,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.01,0.3287103891372681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,4,power_law_1.2,0.11115520000457764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.01,3.555583953857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,balanced,0.6096053520838419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,power_law_1.01,0.07793279886245727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.01,0.4008768081665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,4,power_law_1.2,0.15578240156173706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,power_law_1.01,0.06355839967727661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.01,0.5681151866912841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.01,8.176486206054687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,4,power_law_1.2,0.17305599451065062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,balanced,0.7429493268330892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,power_law_1.01,0.07863680124282837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.01,0.73056001663208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,4,power_law_1.2,0.17262719869613646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,power_law_1.01,0.08851199746131896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.01,0.9408127784729003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,4,power_law_1.2,0.1862912058830261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,balanced,1.5049120585123699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,power_law_1.01,0.1196671962738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.01,1.437337589263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,4,power_law_1.2,0.18129279613494872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,balanced,1.0738506317138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,power_law_1.01,0.12629760503768922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,4,power_law_1.2,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.01,1.7792703628540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,power_law_1.01,0.13375999927520751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,4,power_law_1.2,0.20393600463867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.01,2.306374359130859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,power_law_1.01,0.13175040483474731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,4,power_law_1.2,0.21481599807739257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,power_law_1.01,0.13498239517211913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.01,3.486105728149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,balanced,1.4119200706481934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,4,power_law_1.2,0.21188480854034425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,4,power_law_1.2,0.23192958831787108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,power_law_1.01,0.14627200365066528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.01,7.003359985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,4,power_law_1.2,0.24065918922424318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,power_law_1.01,0.1564736008644104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,4,power_law_1.2,0.2664639949798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,balanced,1.8214772542317708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,power_law_1.01,0.16524159908294678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,4,power_law_1.2,0.3035072088241577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,power_law_1.01,0.17870080471038818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,4,power_law_1.2,0.32807040214538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,balanced,1.9962612787882488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,power_law_1.01,0.19942400455474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,4,power_law_1.2,0.3869184017181396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,4,power_law_1.2,0.4394752025604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,4,power_law_1.2,0.5432384014129639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,power_law_1.01,0.20716800689697265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,4,power_law_1.2,0.6807104110717773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,balanced,5.397466659545898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,4,power_law_1.2,0.9463680267333985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,power_law_1.01,0.22254719734191894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,4,power_law_1.2,1.1920255661010741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,balanced,2.646341323852539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,4,power_law_1.2,1.5796992301940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,4,power_law_1.2,2.2862592697143556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,power_law_1.01,0.2657984018325806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,4,power_law_1.2,2.8239871978759767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,power_law_1.01,0.34048640727996826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,balanced,2.8260320027669272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,4,power_law_1.2,4.9585216522216795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,power_law_1.01,0.41804161071777346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,power_law_1.01,0.5182464122772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,4,power_law_1.2,8.411942291259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,power_law_1.01,0.690937614440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,balanced,3.2341651916503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,power_law_1.01,0.9059840202331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,power_law_1.01,1.3805567741394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,power_law_1.01,1.6013376235961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,power_law_1.01,2.460825538635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,4,power_law_1.2,0.059059202671051025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,power_law_1.01,3.276095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,4,power_law_1.2,0.052767997980117796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,power_law_1.01,4.413235092163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,4,power_law_1.2,0.058323198556900026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,4,power_law_1.2,0.07301759719848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,power_law_1.01,7.229580688476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,4,power_law_1.2,0.0828544020652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,4,power_law_1.2,0.11411839723587036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,power_law_1.01,13.360972595214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,4,power_law_1.2,0.12093440294265748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,balanced,5.107066790262858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,4,power_law_1.2,0.12259839773178101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,4,power_law_1.2,0.12636799812316896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,4,power_law_1.2,0.12958719730377197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,4,power_law_1.2,0.13843200206756592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,4,power_law_1.2,0.14384000301361083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,4,power_law_1.2,0.14978560209274291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,4,power_law_1.2,0.15047039985656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,balanced,5.592458724975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,4,power_law_1.2,0.16909439563751222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,4,power_law_1.2,0.17238399982452393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,4,power_law_1.2,0.1816256046295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,4,power_law_1.2,0.21413760185241698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,4,power_law_1.2,0.23767681121826173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,4,power_law_1.2,0.2991487979888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,4,power_law_1.2,0.3428735971450806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,4,power_law_1.2,0.4612800121307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,4,power_law_1.2,0.5898816108703613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,4,power_law_1.2,0.8490559577941894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,4,power_law_1.2,1.1469823837280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,4,power_law_1.2,1.5909567832946778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,4,power_law_1.2,2.065465545654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,4,power_law_1.2,2.866924858093262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,4,power_law_1.2,3.5403583526611326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,balanced,10.228517532348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,4,power_law_1.2,8.882476806640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,4,power_law_1.2,0.06718080043792725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,4,power_law_1.2,0.05603839755058289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,4,power_law_1.2,0.06121600270271301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,4,power_law_1.2,0.07430400252342224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,4,power_law_1.2,0.08234879970550538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,4,power_law_1.2,0.11719039678573609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,4,power_law_1.2,0.1249343991279602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,4,power_law_1.2,0.12718080282211303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,4,power_law_1.2,0.133241605758667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,4,power_law_1.2,0.14298880100250244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,4,power_law_1.2,0.1491968035697937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,4,power_law_1.2,0.1568384051322937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,4,power_law_1.2,0.1747712016105652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,4,power_law_1.2,0.18165760040283202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,4,power_law_1.2,0.19869439601898192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,balanced,0.05481066803137461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,4,power_law_1.2,0.206278395652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,balanced,0.06484800080458324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,balanced,0.0787306676308314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,4,power_law_1.2,0.23180160522460938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,balanced,0.11539733409881592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,balanced,0.1755253275235494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,balanced,0.21100799242655435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,4,power_law_1.2,0.2597120046615601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,balanced,0.05115200082461039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,balanced,0.21406400203704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,4,power_law_1.2,0.33283200263977053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,balanced,0.2179786761601766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,balanced,0.05418666700522105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,balanced,0.21847466627756754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,4,power_law_1.2,0.44188799858093264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,balanced,0.06457599997520447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,balanced,0.2232159972190857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,balanced,0.09158933162689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,4,power_law_1.2,0.5594880104064941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,balanced,0.22500266631444296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,balanced,0.1334933340549469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,4,power_law_1.2,0.7678719997406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,balanced,0.2296853264172872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,4,power_law_1.2,1.0670528411865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,balanced,0.15127999583880106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,balanced,0.232314666112264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,4,power_law_1.2,1.46496639251709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,balanced,0.15383999546368918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,balanced,0.2421333392461141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,4,power_law_1.2,1.798054313659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,balanced,0.1532266636689504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,balanced,0.2541813254356384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,balanced,0.15565866231918335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,4,power_law_1.2,2.861926460266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,balanced,0.25757867097854614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,balanced,0.1586240033308665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,4,power_law_1.2,3.689651107788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,balanced,0.266704003016154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,balanced,0.15820266803105673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,4,power_law_1.2,4.28210563659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,balanced,0.32472532987594604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,balanced,0.16141866644223532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,balanced,0.06497600177923839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,balanced,0.3170986572901408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,balanced,0.16396266222000122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,4,power_law_1.2,8.815296173095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,balanced,0.0691893349091212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,balanced,0.40507201353708905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,balanced,0.1718026598294576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,balanced,0.0783786674340566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,balanced,0.18126932779947916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,4,power_law_1.2,15.837484741210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,balanced,0.10756799578666687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,balanced,0.44844265778859455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,balanced,0.14594133694966635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,balanced,0.19058666626612344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,balanced,0.16209066907564798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,balanced,0.16679465770721436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,balanced,0.6624639828999838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,balanced,0.20470933119455972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,balanced,0.1698346734046936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,balanced,0.17252800861994425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,balanced,0.2718506654103597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,balanced,0.17746132612228394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,balanced,0.7160320281982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,balanced,0.18257067600886026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,balanced,0.2595679958661397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.01,0.07179520130157471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,balanced,0.19033066431681314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,balanced,0.3197653293609619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.01,0.06504960060119629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,balanced,0.1979680061340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,balanced,1.1400266488393147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,balanced,0.20939199129740396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.01,0.0661952018737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,balanced,0.3662559986114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,balanced,0.22095467646916708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.01,0.09111679792404175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.01,0.12371200323104858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,balanced,0.5541866620381674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,balanced,1.3142879803975422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.01,0.1675647974014282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.01,0.1739776015281677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,balanced,0.24174400170644125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,balanced,0.6590079863866171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.01,0.1897536039352417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.01,0.05317760109901428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.01,0.19543039798736572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.01,0.06071680188179016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.01,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.01,0.19983999729156493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,balanced,1.0059200127919514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.01,0.08080639839172363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,balanced,2.018885294596354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.01,0.21266560554504393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,balanced,0.2767840027809143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.01,0.09132159948348999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.01,0.22199680805206298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.01,0.23029758930206298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.01,0.12374399900436402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.01,0.25132160186767577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,balanced,1.2430986563364665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.01,0.13344000577926635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.01,0.2690112113952637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.01,0.27589120864868166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,balanced,0.3670719861984253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.01,0.13986560106277465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.01,0.3076927900314331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,balanced,0.4283733367919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.01,0.14162559509277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,balanced,2.449578603108724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.01,0.35085439682006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.01,0.3625152111053467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,balanced,0.5632160107294718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.01,0.1520640015602112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,balanced,1.864949385325114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.01,0.41201281547546387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.01,0.15261440277099608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,balanced,0.6880319913228353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.01,0.488921594619751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.01,0.16224000453948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.01,0.6882304191589356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.01,0.1679487943649292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,balanced,1.0198506514231365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.01,0.9412991523742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.01,0.17198079824447632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.01,1.2511808395385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.01,0.19676799774169923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.01,1.4933183670043946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,balanced,1.2688053448994954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.01,0.2056447982788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,balanced,2.8972107569376626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,balanced,2.2795626322428384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.01,2.2697919845581054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.01,0.22004480361938478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,2,power_law_1.2,0.07169280052185059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.01,0.27733759880065917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.01,2.8953792572021486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,balanced,1.8441492716471355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,2,power_law_1.2,0.06340479850769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.01,0.2820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,power_law_1.01,0.06581760048866273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.01,3.326649475097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,2,power_law_1.2,0.0710591971874237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.01,0.34600319862365725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,power_law_1.01,0.07335039973258972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,2,power_law_1.2,0.09176959991455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.01,0.4254144191741943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.01,5.508428955078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,power_law_1.01,0.07511039972305297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,2,power_law_1.2,0.11014399528503419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.01,0.5592448234558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,power_law_1.01,0.0917568027973175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,2,power_law_1.2,0.17240320444107055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,balanced,2.412597338358561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,power_law_1.01,0.10568959712982177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.01,0.6975872039794921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.01,10.069779205322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,2,power_law_1.2,0.18287999629974366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,power_law_1.01,0.1416640043258667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,2,power_law_1.2,0.19515520334243774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.01,1.0246591567993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,balanced,2.718111991882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,power_law_1.01,0.15022079944610595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,2,power_law_1.2,0.19752960205078124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,power_law_1.01,0.15508480072021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.01,1.3410240173339845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,2,power_law_1.2,0.20933120250701903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,power_law_1.01,0.1617535948753357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.01,1.8414272308349608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,2,power_law_1.2,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,power_law_1.01,0.170579195022583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,balanced,3.4726826349894204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,power_law_1.01,0.18350080251693726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,2,power_law_1.2,0.23161599636077881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.01,2.3040960311889647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,power_law_1.01,0.19738880395889283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,2,power_law_1.2,0.2358720064163208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,balanced,4.5065867106119795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,power_law_1.01,0.20949759483337402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.01,3.0950143814086912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,2,power_law_1.2,0.2503999948501587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,power_law_1.01,0.2277695894241333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,2,power_law_1.2,0.2693824052810669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,power_law_1.01,0.2522176027297974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.01,4.8862144470214846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,2,power_law_1.2,0.27947518825531004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,2,power_law_1.2,0.3109568119049072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.01,9.789657592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,power_law_1.01,0.27035520076751707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,2,power_law_1.2,0.363974404335022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,balanced,4.607717196146647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,2,power_law_1.2,0.36637439727783205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,power_law_1.01,0.311955189704895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,2,power_law_1.2,0.43511037826538085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,balanced,4.3245547612508135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,2,power_law_1.2,0.5428160190582275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,power_law_1.01,0.3805824041366577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,2,power_law_1.2,0.6531583786010742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,power_law_1.01,0.4617919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,2,power_law_1.2,0.9695743560791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,power_law_1.01,0.6293951988220214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,2,power_law_1.2,1.179155158996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,power_law_1.01,0.7578688144683838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,power_law_1.01,1.0792256355285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,2,power_law_1.2,1.6422399520874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,power_law_1.01,1.3936063766479492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,balanced,5.642080307006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,2,power_law_1.2,2.462848091125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,power_law_1.01,1.9711616516113282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,power_law_1.01,2.931571197509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,2,power_law_1.2,2.907257652282715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,power_law_1.01,4.139583969116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,2,power_law_1.2,3.3116607666015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,power_law_1.01,5.053631973266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,2,power_law_1.2,5.023136138916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,power_law_1.01,6.348652648925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,power_law_1.2,11.421324920654296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,power_law_1.01,10.343443298339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,power_law_1.01,21.7503173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,2,balanced,9.153605143229166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,balanced,8.992757161458334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,2,power_law_1.2,0.05319039821624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,2,power_law_1.2,0.05232639908790589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,2,power_law_1.2,0.056908798217773435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,2,power_law_1.2,0.0751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,2,power_law_1.2,0.08579199910163879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,balanced,8.868895848592123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,2,power_law_1.2,0.12392319440841675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,2,power_law_1.2,0.13530240058898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,2,power_law_1.2,0.14200960397720336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,2,power_law_1.2,0.14413440227508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,2,power_law_1.2,0.15275520086288452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,2,power_law_1.2,0.15546239614486695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,2,power_law_1.2,0.1668352007865906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,2,power_law_1.2,0.16902400255203248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,2,power_law_1.2,0.18458240032196044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,2,power_law_1.2,0.19882880449295043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,2,power_law_1.2,0.20745599269866943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,2,power_law_1.2,0.2222912073135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,2,power_law_1.2,0.27461121082305906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,2,power_law_1.2,0.28998401165008547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,2,power_law_1.2,0.3474560022354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,2,power_law_1.2,0.4355264186859131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,2,power_law_1.2,0.5588607788085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,2,power_law_1.2,0.7297215938568116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,2,power_law_1.2,1.1374336242675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,2,power_law_1.2,1.3226688385009766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,2,power_law_1.2,2.035628890991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,balanced,17.870763142903645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,2,power_law_1.2,2.5946752548217775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,2,power_law_1.2,3.2339839935302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,2,power_law_1.2,5.456166458129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,2,power_law_1.2,10.55159683227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,2,power_law_1.2,0.06589440107345582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,2,power_law_1.2,0.0686464011669159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,2,power_law_1.2,0.07655680179595947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,2,power_law_1.2,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,2,power_law_1.2,0.10217599868774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,2,power_law_1.2,0.1399359941482544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,2,power_law_1.2,0.15425280332565308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,2,power_law_1.2,0.16088320016860963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,2,power_law_1.2,0.16663680076599122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,2,power_law_1.2,0.17151999473571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,2,power_law_1.2,0.18979840278625487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,2,power_law_1.2,0.2023103952407837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,balanced,0.07100266714890797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,2,power_law_1.2,0.21608319282531738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,2,power_law_1.2,0.241158390045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,balanced,0.07022933165232341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,balanced,0.0888853371143341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,2,power_law_1.2,0.2586047887802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,balanced,0.12778133153915405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,balanced,0.20301334063212076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,balanced,0.2572159965833028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,balanced,0.26050132513046265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,2,power_law_1.2,0.26835200786590574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,balanced,0.25726399819056195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,balanced,0.26074665784835815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,balanced,0.265882670879364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,balanced,0.2704640030860901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,2,power_law_1.2,0.31078400611877444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,balanced,0.2780906756718953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,balanced,0.2812959949175517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,balanced,0.2911786635716756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,2,power_law_1.2,0.39096319675445557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,balanced,0.3057439923286438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,2,power_law_1.2,0.48158721923828124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,balanced,0.35181868076324463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,balanced,0.33081066608428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,2,power_law_1.2,0.6368703842163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,balanced,0.4757973353068034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,balanced,0.05859733124574026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,2,power_law_1.2,0.7995327949523926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,balanced,0.4231040080388387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,2,power_law_1.2,1.158732795715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,balanced,0.06162666777769724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,2,power_law_1.2,1.500051212310791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,balanced,0.0745119998852412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,balanced,0.5534079869588217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,2,power_law_1.2,2.101587104797363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,balanced,0.10520533720652263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,2,power_law_1.2,2.9933311462402346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,balanced,0.16033599774042764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,balanced,0.6212639808654785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,balanced,0.19014400243759155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,2,power_law_1.2,4.104576110839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,balanced,0.19344000021616617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,balanced,0.19779199361801147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,2,power_law_1.2,5.160044860839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,balanced,0.9574133555094401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,balanced,0.2030400037765503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.06939520239830017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,balanced,0.20141865809758505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,2,power_law_1.2,7.118879699707032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,balanced,0.20388267437616983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.06581760048866273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,balanced,1.1824586391448975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.07938560247421264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,balanced,0.20755734046300253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,2,power_law_1.2,11.000109100341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.10467840433120727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,balanced,0.21954667568206787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.13178240060806273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,balanced,0.22823466857274374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.20061440467834474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,balanced,0.24168533086776733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,balanced,1.7663200696309407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,2,power_law_1.2,23.897990417480468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.20758399963378907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,balanced,0.2582719922065735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.01,0.05742080211639404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.2261631965637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,balanced,0.281765341758728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.23858559131622314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.01,0.05720319747924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,balanced,0.43406931559244794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.248307204246521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.01,0.06600959897041321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,balanced,0.35983999570210773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,balanced,2.244032065073649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.01,0.08866559863090515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.2534271955490112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,balanced,0.46278401215871173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.01,0.10234240293502808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.2625152111053467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.01,0.15093120336532592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,balanced,0.5227413177490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.27869439125061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.01,0.16984959840774536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.3042623996734619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,balanced,0.8666559855143229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.01,0.17306239604949952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.32727038860321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,balanced,3.3117653528849282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.01,0.18108160495758058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.35971839427948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.01,0.18832000494003295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,balanced,1.0660853385925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.36897280216217043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.01,0.20035200119018554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.01,0.21639039516448974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.4680768013000488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.01,0.22514560222625732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.4633664131164551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,balanced,1.6404213905334473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.01,0.23912959098815917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.5821375846862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.01,0.2566400051116943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.6700352191925049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.01,0.28296959400177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,balanced,4.015520095825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.01,0.32074880599975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.8895296096801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,balanced,2.0847999254862466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.01,0.3978368043899536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.01,1.1321599960327149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.01,0.39393279552459715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.01,1.6211135864257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.01,0.49032320976257326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.01,2.078976058959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.01,0.6046592235565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.06863359808921814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.01,0.8054911613464355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.01,3.124812889099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.01,1.0445055961608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,balanced,3.1018667221069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.061286401748657224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.01,3.997292709350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.07624959945678711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.01,1.5036479949951171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.0958400011062622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.01,5.0561473846435545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,balanced,4.896138509114583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.01,1.9179840087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.12347520589828491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.18602240085601807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.01,2.922559928894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.01,8.187430572509765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.21390719413757325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.01,3.687763214111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.23129599094390868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.2424448013305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.01,4.642144012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.01,16.339999389648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.24846720695495605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.2596544027328491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,balanced,3.79586124420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.01,7.77352294921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.27182080745697024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.2878079891204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.3108992099761963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.01,15.590118408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.34415359497070314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.368723201751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.3720832109451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.4732672214508057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.47450881004333495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.5897024154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.6802495956420899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,balanced,8.048432032267252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,balanced,4.659951845804851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.9156288146972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,1,power_law_1.2,1.1501248359680176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,1,power_law_1.2,1.6624895095825196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,1,power_law_1.2,2.1245887756347654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,1,power_law_1.2,3.165331268310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,1,power_law_1.2,4.077228927612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,1,power_law_1.2,5.1959999084472654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,1,power_law_1.2,8.224339294433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,power_law_1.2,16.3204345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,balanced,7.697498957316081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,1,balanced,16.425669352213543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,1,power_law_1.2,0.05232639908790589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,1,power_law_1.2,0.05498239994049072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,1,power_law_1.2,0.06366080045700073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,1,power_law_1.2,0.08022400140762329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,1,power_law_1.2,0.10090240240097045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,1,power_law_1.2,0.15447039604187013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,balanced,15.653493245442709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,1,power_law_1.2,0.1648576021194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,1,power_law_1.2,0.1777151942253113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,1,power_law_1.2,0.1892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,1,power_law_1.2,0.19018880128860474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,1,power_law_1.2,0.20356481075286864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,1,power_law_1.2,0.2246079921722412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,1,power_law_1.2,0.23708798885345458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,1,power_law_1.2,0.2428607940673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,1,power_law_1.2,0.2670783996582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,1,power_law_1.2,0.2866879940032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,1,power_law_1.2,0.319488000869751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,1,power_law_1.2,0.40263681411743163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,1,power_law_1.2,0.4037439823150635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,1,power_law_1.2,0.5037375926971436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,1,power_law_1.2,0.6199935913085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,1,power_law_1.2,0.8423808097839356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,1,power_law_1.2,1.070035171508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,1,power_law_1.2,1.5586112022399903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,1,power_law_1.2,1.9588607788085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,1,power_law_1.2,2.981318473815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,1,power_law_1.2,3.8214462280273436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,1,power_law_1.2,4.8337665557861325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,1,power_law_1.2,7.755820465087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,balanced,0.19928000370661417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,balanced,0.1920586625734965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,balanced,0.1911946733792623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,1,power_law_1.2,15.312991333007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,balanced,0.3499786853790283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,balanced,0.6661760012308756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,balanced,1.25272003809611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,balanced,1.8073919614156086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,balanced,1.9304107030232747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,balanced,1.9097919464111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,balanced,0.1211946705977122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,balanced,1.9635839462280273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,balanced,0.12019733587900798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,balanced,1.853482723236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,balanced,0.12372266252835591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,balanced,1.88481601079305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,balanced,0.21157334248224893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,balanced,1.7707626024882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,balanced,0.3803146680196126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,balanced,0.6932053565979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,balanced,1.8563626607259114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,balanced,1.0140746434529622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,balanced,1.868735949198405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,balanced,0.9403893152872721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,balanced,1.9486400286356609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,balanced,0.9320533275604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,balanced,1.8351999918619792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,balanced,0.9584213097890218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,balanced,0.05835199852784475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,balanced,1.9207146962483723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,balanced,1.0700053373972576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,balanced,1.0271093050638835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,balanced,1.7991520563761394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,balanced,0.05641066531340281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,balanced,0.9555199940999349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,balanced,0.059690664211908974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,balanced,1.7354772885640461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,balanced,0.07996266583601634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,balanced,0.9801493485768636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.01,1.2369088172912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,balanced,0.11407466729482015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,balanced,0.9247626463572184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,balanced,0.16059199968973795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,balanced,1.740298589070638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.01,1.778816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,balanced,0.9487786293029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,balanced,0.2192479968070984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,balanced,0.9373066425323486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,balanced,0.2205173373222351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.01,1.768057632446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,balanced,0.22106132904688516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,balanced,1.598629315694173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,balanced,0.9743200143178304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.01,0.5776256084442138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,balanced,0.22124266624450684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.01,0.8117312431335449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,balanced,1.09279465675354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.01,1.0097984313964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,balanced,0.22294400135676065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,balanced,1.4832852681477864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.01,1.2215295791625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,balanced,0.9642186959584554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.01,1.4637311935424804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,balanced,0.2257173260052999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.01,1.4397120475769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,balanced,0.9960693518320719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.01,1.6045440673828124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,balanced,0.22671999533971152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,balanced,1.1201279958089192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.01,1.6432960510253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,balanced,0.960752010345459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,balanced,0.22964799404144287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.01,1.5799872398376464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.01,1.7309120178222657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,balanced,0.23815999428431192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,balanced,0.9226506551106771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.01,1.6841535568237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,balanced,3.102405230204264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.7034048080444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.01,1.5125951766967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,balanced,0.23853333791097006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.01,1.571174430847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.01,0.9886272430419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,balanced,0.24567466974258423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.01,1.4858880043029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,balanced,0.769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.01,1.0099519729614257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.01,1.5269951820373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,balanced,0.2592746615409851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.312825608253479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.01,1.6858688354492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.4781631946563721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,balanced,2.2538506189982095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.01,2.0378047943115236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.5684607982635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,balanced,1.8416159947713215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.01,2.106937599182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.6720895767211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.01,2.5897151947021486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,balanced,0.2744053403536479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.800601577758789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.01,3.1005376815795898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.7825535774230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.01,4.011167907714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.7872064113616943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,balanced,1.4504586855570476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,balanced,4.054394721984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.7898176193237305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.01,4.958617782592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.7958720207214356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.01,6.664588928222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.8386303901672363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.01,9.612467193603516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,balanced,0.2974506616592407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.8963775634765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.839686393737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,balanced,0.32123732566833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.01,10.788614654541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.8530048370361328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,balanced,2.5041759808858237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.7760640144348144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,power_law_1.01,0.1831936001777649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,balanced,0.36508798599243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.01,16.103846740722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.8542592048645019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,balanced,5.761679967244466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,power_law_1.01,0.21813759803771973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,1.012230396270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,power_law_1.01,0.2134848117828369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,1.0306367874145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,power_law_1.01,0.0910975992679596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,1.1596863746643067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.01,35.95272216796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,power_law_1.01,0.11392639875411988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,power_law_1.01,0.14276479482650756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,1.4733375549316405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,power_law_1.01,0.171833598613739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,balanced,0.4161813259124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,1.6038143157958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,power_law_1.01,0.18546559810638427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,power_law_1.01,0.18151040077209474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,balanced,3.4535786310831704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,2.146393585205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,power_law_1.01,0.19214080572128295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,power_law_1.01,0.19471360445022584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,balanced,0.5080106655756632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,2.6365184783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,power_law_1.01,0.19928959608078003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,3.5269054412841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,32,power_law_1.2,1.2443455696105956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,power_law_1.01,0.209881591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,power_law_1.01,0.22930560111999512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,4.9150337219238285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,32,power_law_1.2,1.776857566833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,power_law_1.01,0.23215999603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,32,power_law_1.2,1.5989439964294434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,power_law_1.01,0.23923840522766113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.01,5.54461441040039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,balanced,8.291151682535807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,power_law_1.01,0.2664639949798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,32,power_law_1.2,0.5172607898712158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,power_law_1.01,0.32106239795684816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,32,power_law_1.2,0.7967679977416993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.01,9.416947174072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,balanced,0.6781866550445557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,32,power_law_1.2,1.0469568252563477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.7221951961517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,32,power_law_1.2,1.1397760391235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.01,0.3351936101913452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,32,power_law_1.2,1.0418496131896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.01,18.02447967529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,32,power_law_1.2,1.418668842315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.8500479698181153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,balanced,5.025904019673665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,32,power_law_1.2,1.3278847694396974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.28105599880218507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.01,0.35658879280090333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,32,power_law_1.2,1.513145637512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,balanced,0.869861364364624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.4586495876312256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.01,0.41790080070495605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,32,power_law_1.2,1.5191103935241699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.4983232021331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.01,0.5407487869262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,32,power_law_1.2,1.4087424278259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.46340479850769045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,32,power_law_1.2,1.480793571472168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.01,0.6437888145446777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.7849599838256835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,32,power_law_1.2,1.4930368423461915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.01,0.7982592105865478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.8045056343078614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,32,power_law_1.2,1.4734208106994628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.7744319915771485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.01,1.2091456413269044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,32,power_law_1.2,1.5054207801818849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.7173376083374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,balanced,1.1791840394337971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.8111616134643554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,32,power_law_1.2,1.6097536087036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.01,1.6819711685180665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.8386240005493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,32,power_law_1.2,1.757868766784668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.01,2.11409912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.8607999801635742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,32,power_law_1.2,1.9444095611572265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,power_law_1.01,2.607980728149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.8528896331787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,32,power_law_1.2,2.3097728729248046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.8784319877624511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,power_law_1.01,4.26561279296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,32,power_law_1.2,2.385331153869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.8502847671508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,32,power_law_1.2,3.1475648880004883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.9184384346008301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,power_law_1.01,8.4172607421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,balanced,1.4846347173055012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,32,power_law_1.2,3.6697792053222655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,1.042630386352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,balanced,14.301029205322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,1.2614656448364259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,32,power_law_1.2,4.975155258178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,1.4497535705566407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,32,power_law_1.2,6.529273223876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,1.6489919662475585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,32,power_law_1.2,11.340652465820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,2.2494911193847655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,balanced,8.775541305541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,32,power_law_1.2,11.98268814086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,2.8923648834228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,3.3599361419677733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,32,power_law_1.2,14.415379333496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,5.0571136474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,6.787820434570312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,32,power_law_1.2,23.784307861328124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,balanced,2.300656000773112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,32,power_law_1.2,7.6468864440917965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,32,power_law_1.2,12.495475006103515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,32,power_law_1.2,54.567376708984376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,32,power_law_1.2,32.529779052734376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,32,power_law_1.2,0.18358399868011474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,balanced,4.508576075236003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,32,power_law_1.2,0.21800320148468016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,32,power_law_1.2,0.14542720317840577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,32,power_law_1.2,0.08900480270385742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,32,power_law_1.2,0.11174399852752685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,32,power_law_1.2,0.13909120559692384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,32,power_law_1.2,0.1404096007347107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,32,power_law_1.2,0.18078720569610596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,32,power_law_1.2,0.185971200466156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,32,power_law_1.2,0.19048960208892823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,balanced,0.06588799754778545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,32,power_law_1.2,0.18317439556121826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,32,power_law_1.2,0.20407040119171144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,balanced,0.06136533121267954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,32,power_law_1.2,0.19429759979248046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,balanced,0.07231999933719635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,32,power_law_1.2,0.21794559955596923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,balanced,0.10532266894976298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,32,power_law_1.2,0.25119359493255616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,balanced,0.1607360045115153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,32,power_law_1.2,0.258950400352478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,balanced,0.2691413362820943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,32,power_law_1.2,0.29212160110473634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,balanced,0.3859306573867798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,32,power_law_1.2,0.35078399181365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,balanced,0.39070932070414227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,balanced,0.3898666699727376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.2,0.3807231903076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,balanced,0.3905920187632243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,balanced,0.39474133650461835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,balanced,0.39660267035166424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,balanced,0.396346648534139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.2,0.4103360176086426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,balanced,0.398693323135376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.2,0.45391359329223635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,balanced,0.40602131684621173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.2,0.6287744045257568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,balanced,0.4076746702194214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,balanced,0.4157866636912028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.2,0.7178751945495605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,balanced,0.42642664909362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.2,1.0065088272094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,balanced,0.44139734903971356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,balanced,0.05057600140571594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.2,1.353171157836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,balanced,0.05230399966239929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,balanced,0.4628213246663411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,balanced,0.05755733450253805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.2,2.0175296783447267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,balanced,0.07740800082683563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,balanced,0.48349865277608234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,balanced,0.10656533638636272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.2,2.615897560119629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,balanced,0.16363733013470969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,32,power_law_1.2,3.2677375793457033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,balanced,0.2230666677157084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,balanced,0.5235946575800577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,balanced,0.22395733992258707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,32,power_law_1.2,6.024537658691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,balanced,0.22441067298253378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,balanced,0.22564800580342612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,balanced,0.5718773206075033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,balanced,0.22765866915384927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,32,power_law_1.2,11.636083221435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,balanced,0.2300800085067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.01,0.16632319688796998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,balanced,0.23203732570012411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,balanced,0.23406932751337686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,balanced,0.6487146615982056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.01,0.26963200569152834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,balanced,0.2425866723060608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.01,0.3787264108657837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,balanced,0.049269333481788635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,balanced,0.2448800007502238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.01,0.11651840209960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,balanced,0.049584001302719116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,balanced,0.25262399514516193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.01,0.1090880036354065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,balanced,0.06066133578618368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.01,0.1657855987548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,balanced,0.7613706588745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,balanced,0.2688426574071248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,balanced,0.0812906672557195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.01,0.20709760189056398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.01,0.15746560096740722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,balanced,0.11610133449236552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,balanced,0.28294400374094647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.01,0.2123136043548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.01,0.24245760440826417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,balanced,0.16142400105794272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,balanced,0.2188160022099813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.01,0.08488960266113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,balanced,0.3097280065218608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.01,0.3019903898239136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,balanced,0.22057600816090903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.01,0.3173504114151001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.01,0.1118016004562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,balanced,0.22071999311447144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,balanced,0.3410986661911011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,balanced,0.9200159708658854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,balanced,0.2213653326034546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.01,0.3178688049316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.01,0.13038719892501832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,balanced,0.2243946592013041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.01,0.3030143976211548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,balanced,0.3950986862182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.01,0.15557119846343995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,balanced,0.2265226642290751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.01,0.29791998863220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,balanced,0.22857600450515747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.01,0.17909760475158693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,balanced,0.23233066002527872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.01,0.3212671995162964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.01,0.18301440477371217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,balanced,0.45019733905792236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,balanced,0.24035733938217163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.01,0.31612799167633054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.01,0.18568960428237916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,balanced,0.24242132902145386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.01,0.35053439140319825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.01,0.19748480319976808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,balanced,1.1954452991485596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,balanced,0.25064533948898315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.01,0.3955391883850098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,balanced,0.5531040032704672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.01,0.18511359691619872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,balanced,0.2676053245862325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.01,0.4086400032043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.01,0.1938752055168152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.01,0.4299647808074951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,power_law_1.01,0.11775360107421876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.01,0.21583359241485595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.01,0.4479423999786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.01,0.21852800846099854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,power_law_1.01,0.16814080476760865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,balanced,0.6806240081787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.01,0.23442559242248534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.01,0.49684481620788573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,power_law_1.01,0.22371199131011962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,balanced,0.2840320070584615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.01,0.23597440719604493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,power_law_1.01,0.09504640102386475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.01,0.5402560234069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.01,0.26759040355682373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,power_law_1.01,0.10688639879226684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.01,0.666099214553833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,balanced,1.4343679745992024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,power_law_1.01,0.14069759845733643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.01,0.26751999855041503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.01,0.7386496067047119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,balanced,0.895423968633016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,power_law_1.01,0.1550528049468994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.01,0.33272318840026854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.01,1.0005248069763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,power_law_1.01,0.1812991976737976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.01,0.3733567953109741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.01,1.064633560180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,power_law_1.01,0.17424000501632692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.01,0.48640642166137693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,balanced,0.3148533304532369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.01,1.4848320007324218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,power_law_1.01,0.18405760526657106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.01,0.5107135772705078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,balanced,0.3449173370997111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,power_law_1.01,0.19729280471801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.01,1.7640960693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.01,0.6955840110778808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,16,power_law_1.2,0.17031680345535277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,power_law_1.01,0.20908160209655763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.01,0.8425215721130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.01,2.11396484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,balanced,0.4084693193435669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,balanced,1.1696320374806721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,16,power_law_1.2,0.268339204788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,power_law_1.01,0.21380479335784913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.01,1.1630271911621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.01,3.3320960998535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,16,power_law_1.2,0.2139456033706665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,power_law_1.01,0.22545280456542968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.01,1.5674176216125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,16,power_law_1.2,0.11331199407577515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,power_law_1.01,0.22938880920410157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.01,5.898342514038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.01,1.9556095123291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,16,power_law_1.2,0.14408960342407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,power_law_1.01,0.22918400764465333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,16,power_law_1.2,0.16522879600524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,balanced,2.109205404917399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.01,2.830860710144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,power_law_1.01,0.2651007890701294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,balanced,0.484661340713501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,16,power_law_1.2,0.23454720973968507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,power_law_1.01,0.32467200756073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,16,power_law_1.2,0.2995199918746948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.01,5.613100814819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,16,power_law_1.2,0.2891648054122925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,balanced,0.6115893522898356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,16,power_law_1.2,0.28701438903808596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,balanced,1.4693439801534016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,power_law_1.01,0.33420159816741946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,16,power_law_1.2,0.3159424066543579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,16,power_law_1.2,0.3200000047683716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,16,power_law_1.2,0.33518080711364745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,16,power_law_1.2,0.3640255928039551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,power_law_1.01,0.34986879825592043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,balanced,0.8131306966145834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,16,power_law_1.2,0.36163198947906494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,power_law_1.01,0.4535359859466553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,16,power_law_1.2,0.38940160274505614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,16,power_law_1.2,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,power_law_1.01,0.5773375988006592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,16,power_law_1.2,0.4386752128601074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,16,power_law_1.2,0.46273279190063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,power_law_1.01,0.6758528232574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,16,power_law_1.2,0.5572671890258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,power_law_1.01,0.9624383926391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,16,power_law_1.2,0.5701183795928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,balanced,1.0671253204345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,16,power_law_1.2,0.7691008090972901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,power_law_1.01,1.121190357208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,16,power_law_1.2,0.8326527595520019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,power_law_1.01,1.7184959411621095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,16,power_law_1.2,1.0033087730407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,balanced,2.159898598988851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,16,power_law_1.2,1.2547967910766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,power_law_1.01,2.1943679809570313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,16,power_law_1.2,1.6300416946411134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,power_law_1.01,2.5729408264160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,16,power_law_1.2,2.309612846374512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,power_law_1.01,4.369862365722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,16,power_law_1.2,2.9630783081054686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,balanced,1.4350132942199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,16,power_law_1.2,3.6946880340576174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,power_law_1.01,8.690995025634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,power_law_1.2,8.041741180419923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,16,balanced,4.094256083170573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,16,power_law_1.2,0.10871679782867431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,balanced,1.8041493097941081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,16,power_law_1.2,0.15831680297851564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,16,power_law_1.2,0.15355520248413085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,16,power_law_1.2,0.09039999842643738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,16,power_law_1.2,0.09853439927101135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,16,power_law_1.2,0.13306879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,16,power_law_1.2,0.1415168046951294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,16,power_law_1.2,0.1687551975250244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,16,power_law_1.2,0.17438080310821533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,16,power_law_1.2,0.18209919929504395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,16,power_law_1.2,0.18305920362472533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,16,power_law_1.2,0.20037760734558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,16,power_law_1.2,0.19263360500335694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,16,power_law_1.2,0.20510079860687255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,balanced,4.225045204162598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,16,power_law_1.2,0.22412800788879395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,balanced,2.8162558873494468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,16,power_law_1.2,0.24316799640655518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,16,power_law_1.2,0.2384255886077881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,16,power_law_1.2,0.2589440107345581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,16,power_law_1.2,0.29049599170684814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,16,power_law_1.2,0.35167360305786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,16,power_law_1.2,0.39365758895874026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,16,power_law_1.2,0.5154240131378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,16,power_law_1.2,0.611187219619751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,16,power_law_1.2,0.750489616394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,16,power_law_1.2,0.9477567672729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,16,power_law_1.2,1.3753151893615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,16,power_law_1.2,1.735308837890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,16,power_law_1.2,2.2680959701538086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,16,power_law_1.2,3.1993343353271486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,16,power_law_1.2,7.246931457519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,balanced,5.488608042399089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,balanced,0.05723733206590017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,balanced,0.07302933434645335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,balanced,0.07282133400440216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,16,power_law_1.2,0.11686400175094605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,balanced,0.10379733641942342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,16,power_law_1.2,0.16521600484848023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,balanced,0.1570186714331309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,16,power_law_1.2,0.13876479864120483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,balanced,0.27196266253789264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,16,power_law_1.2,0.07688959836959838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,balanced,0.38815999031066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,16,power_law_1.2,0.1003775954246521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,balanced,0.39185599486033124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,16,power_law_1.2,0.12536319494247436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,balanced,0.39158932367960614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,balanced,0.3945759932200114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,16,power_law_1.2,0.13289599418640136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,balanced,0.3947840134302775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,16,power_law_1.2,0.16320639848709106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,balanced,0.39716267585754395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,16,power_law_1.2,0.19100799560546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,balanced,0.40144534905751544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,balanced,0.40569599469502765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,16,power_law_1.2,0.18300800323486327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,balanced,0.41326932112375897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,16,power_law_1.2,0.1903872013092041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,balanced,0.41650664806365967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,16,power_law_1.2,0.19043840169906617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,balanced,0.427072008450826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,16,power_law_1.2,0.2038271903991699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,16,power_law_1.2,0.22202880382537843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,balanced,0.44281065464019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,16,power_law_1.2,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,balanced,0.45708266894022626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,16,power_law_1.2,0.2541759967803955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,balanced,0.4835626681645711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.01,0.10685440301895141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,16,power_law_1.2,0.2591423988342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,balanced,0.05676266551017761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.01,0.15355520248413085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,balanced,0.5153546730677286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,16,power_law_1.2,0.32556159496307374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,balanced,0.05759466687838236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.01,0.2595263957977295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,balanced,0.07709866762161255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,balanced,0.10731732845306396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.01,0.09620479941368103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,balanced,0.5740960041681925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,balanced,0.165583997964859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.01,0.1416640043258667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,16,power_law_1.2,0.3509696006774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,balanced,0.22576000293095908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.01,0.18487679958343506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,balanced,0.22609599431355795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,balanced,0.6354986826578776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.01,0.22687358856201173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,balanced,0.22669865687688193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.01,0.27463679313659667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,16,power_law_1.2,0.3908159971237183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,balanced,0.22802132368087769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,balanced,0.052629331747690834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.01,0.29051520824432375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,balanced,0.2327573299407959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,16,power_law_1.2,0.4719423770904541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,balanced,0.056458666920661926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.01,0.2974463939666748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,balanced,0.23452266057332358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,balanced,0.7486080328623453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.01,0.3158015966415405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,16,power_law_1.2,0.6320256233215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,balanced,0.06454933186372121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,balanced,0.23600000143051147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.01,0.32445440292358396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,balanced,0.08545600374539693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,balanced,0.23947733640670776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.01,0.33459200859069826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,balanced,0.11798933148384094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,16,power_law_1.2,0.7481535911560059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,balanced,0.24895999828974405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.01,0.3483392000198364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,balanced,0.16636266311009726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.01,0.34479360580444335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,16,power_law_1.2,1.0042048454284669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,balanced,0.25098133087158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,balanced,0.8699519634246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,balanced,0.22794665892918906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.01,0.36368000507354736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,balanced,0.2619679967562358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,16,power_law_1.2,1.3988160133361816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,balanced,0.22959999243418375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.01,0.3766016006469727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,balanced,0.23132266600926718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.01,0.40082559585571287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,balanced,0.27796266476313275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,16,power_law_1.2,1.9686464309692382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,balanced,0.23177067438761392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.01,0.4409471988677979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,balanced,0.29499200979868573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,balanced,0.23517332474390665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.01,0.49653120040893556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,16,power_law_1.2,2.7534271240234376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,balanced,0.23862399657567343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.01,0.5405119895935059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,balanced,0.3328213294347127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,balanced,1.0912799835205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.01,0.6543231964111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.01,0.07551360130310059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,balanced,0.24130133787790933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,16,power_law_1.2,3.6569087982177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.01,0.7121727943420411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,balanced,0.37293867270151776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,balanced,0.24493332703908285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.01,0.09960319995880126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.01,0.919711971282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,16,power_law_1.2,5.177497482299804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,balanced,0.2555413246154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.01,0.15221760272979737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.01,1.1014080047607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,balanced,0.44364798069000244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,balanced,0.2595946590105693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.01,1.4661888122558593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.01,0.08008959889411926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,balanced,0.2725546757380168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,16,power_law_1.2,10.632115173339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.01,1.8177791595458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,balanced,0.293722669283549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.01,0.09269760251045227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,balanced,0.5039306481679281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.01,2.156108856201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,balanced,1.3987414042154949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.01,0.1297727942466736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.01,3.27509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.01,0.1410048007965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,balanced,0.633296012878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.01,7.113868713378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.01,0.16990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,balanced,0.31710400183995563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.01,0.17689599990844726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.01,0.18215680122375488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,balanced,0.7931146621704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.01,0.19005440473556517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.01,0.20032639503479005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,balanced,1.720037301381429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,balanced,0.3798133134841919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.01,0.19368959665298463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,power_law_1.01,0.08751360177993775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.01,0.20719358921051026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,balanced,0.43292800585428876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,power_law_1.01,0.11273599863052368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.01,0.2131903886795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,balanced,1.0637760162353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,power_law_1.01,0.17455359697341918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.01,0.2274496078491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,balanced,0.5285919904708862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,power_law_1.01,0.07833600044250488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.01,0.23785600662231446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,power_law_1.01,0.10212479829788208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.01,0.2659392118453979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,power_law_1.01,0.13237119913101197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.01,0.2853055953979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,balanced,0.6387840112050375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,power_law_1.01,0.1486080050468445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.01,0.35635199546813967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,power_law_1.01,0.1750208020210266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.01,0.39388160705566405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,power_law_1.01,0.18277759552001954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,balanced,1.392730712890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,power_law_1.01,0.19905920028686525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,balanced,0.8235572973887125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.01,0.4939839839935303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,power_law_1.01,0.20302720069885255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.01,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,balanced,2.526282628377279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,power_law_1.01,0.20675199031829833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,8,power_law_1.2,0.10655360221862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.01,0.7523519992828369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,power_law_1.01,0.21137919425964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,8,power_law_1.2,0.15380480289459228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.01,0.9251456260681152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,power_law_1.01,0.21772160530090331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,balanced,1.1053386529286702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,8,power_law_1.2,0.11518720388412476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,power_law_1.01,0.2408384084701538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.01,1.2926464080810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,8,power_law_1.2,0.10392320156097412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,power_law_1.01,0.24671359062194825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.01,1.691744041442871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,power_law_1.01,0.2705215930938721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,8,power_law_1.2,0.12702720165252684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,balanced,1.697696050008138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,power_law_1.01,0.3273855924606323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,8,power_law_1.2,0.18169599771499634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.01,1.9838336944580077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,8,power_law_1.2,0.19436800479888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,balanced,1.471461296081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.01,2.9187007904052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,8,power_law_1.2,0.2695168018341064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,power_law_1.01,0.37842559814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,8,power_law_1.2,0.2880959987640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.01,6.0726783752441404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,8,power_law_1.2,0.29446399211883545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,power_law_1.01,0.4189568042755127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,8,power_law_1.2,0.3024127960205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,power_law_1.01,0.5044608116149902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,8,power_law_1.2,0.3073663949966431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,power_law_1.01,0.6425151824951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,8,power_law_1.2,0.3122495889663696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,power_law_1.01,0.7507264137268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,balanced,1.9913493792215984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,8,power_law_1.2,0.33345279693603513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,power_law_1.01,1.0869759559631347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,8,power_law_1.2,0.3367743968963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,power_law_1.01,1.4068608283996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,power_law_1.01,1.8313472747802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,8,power_law_1.2,0.3542207956314087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,balanced,2.553749402364095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,power_law_1.01,2.4941312789916994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,8,power_law_1.2,0.3711168050765991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,8,power_law_1.2,0.43566079139709474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,power_law_1.01,3.1485952377319335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,8,power_law_1.2,0.43198719024658205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,power_law_1.01,5.179059219360352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,8,power_law_1.2,0.5255424022674561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,balanced,2.5191946029663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,8,power_law_1.2,0.5496575832366943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,balanced,4.746517181396484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,power_law_1.01,10.024447631835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,8,power_law_1.2,0.6961023807525635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,8,power_law_1.2,0.7486080169677735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,8,power_law_1.2,1.0397695541381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,8,power_law_1.2,1.191500759124756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,8,power_law_1.2,1.697657585144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,8,power_law_1.2,1.9448896408081056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,8,power_law_1.2,2.6932416915893556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,8,power_law_1.2,4.295097732543946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,8,power_law_1.2,8.697990417480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,balanced,3.9262825647989907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,balanced,4.936810811360677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,8,power_law_1.2,0.0757311999797821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,8,power_law_1.2,0.09983360171318054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,8,power_law_1.2,0.10246399641036988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,8,power_law_1.2,0.07867519855499268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,8,power_law_1.2,0.09818239808082581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,8,power_law_1.2,0.08820480108261108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,8,power_law_1.2,0.11218559741973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,8,power_law_1.2,0.1334720015525818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,8,power_law_1.2,0.11289600133895875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,8,power_law_1.2,0.15329920053482055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,8,power_law_1.2,0.1714367985725403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,8,power_law_1.2,0.12050559520721435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,8,power_law_1.2,0.17191679477691652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,8,power_law_1.2,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,8,power_law_1.2,0.1879744052886963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,8,power_law_1.2,0.19567359685897828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,8,power_law_1.2,0.09641600251197815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,8,power_law_1.2,0.19690879583358764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,balanced,7.669333140055339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,8,power_law_1.2,0.21640961170196532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,8,power_law_1.2,0.1272320032119751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,8,power_law_1.2,0.22880640029907226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,8,power_law_1.2,0.14312959909439088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,8,power_law_1.2,0.22986240386962892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,8,power_law_1.2,0.24335360527038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,8,power_law_1.2,0.16826879978179932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,8,power_law_1.2,0.26867198944091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,8,power_law_1.2,0.2983871936798096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,8,power_law_1.2,0.18542720079421998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,8,power_law_1.2,0.35192320346832273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,8,power_law_1.2,0.17923840284347534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,8,power_law_1.2,0.39580159187316893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,8,power_law_1.2,0.18951679468154908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,8,power_law_1.2,0.5221248149871827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,8,power_law_1.2,0.6016255855560303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,8,power_law_1.2,0.20780160427093505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,8,power_law_1.2,0.800102424621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,8,power_law_1.2,0.20551040172576904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,8,power_law_1.2,0.9771903991699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,8,power_law_1.2,0.2226560115814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,8,power_law_1.2,1.4009471893310548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,8,power_law_1.2,0.2458240032196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,8,power_law_1.2,1.8315839767456055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,8,power_law_1.2,0.2491391897201538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,8,power_law_1.2,2.3700096130371096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,8,power_law_1.2,0.26975359916687014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,8,power_law_1.2,3.7005630493164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,8,power_law_1.2,0.3220607995986938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,8,power_law_1.2,7.3327171325683596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,8,power_law_1.2,0.35111680030822756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,8,power_law_1.2,0.4474815845489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,8,power_law_1.2,0.5234687805175782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,balanced,0.05738133192062378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,8,power_law_1.2,0.7373568058013916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,8,power_law_1.2,0.893228816986084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,balanced,0.06216000020503998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,8,power_law_1.2,1.1400511741638184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,balanced,0.07267199953397115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,8,power_law_1.2,1.5285504341125489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,balanced,0.10611200332641602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,balanced,0.16375466187795004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,8,power_law_1.2,2.3208831787109374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,balanced,0.2764693299929301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,balanced,0.39660267035166424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,8,power_law_1.2,2.962156867980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,balanced,0.39815465609232586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,balanced,0.05027733246485392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,8,power_law_1.2,4.2780609130859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,balanced,0.3985919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,balanced,0.05268266797065735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,balanced,0.4029013315836589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,balanced,0.40808534622192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,balanced,0.05879466732343038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,8,power_law_1.2,5.8899070739746096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,balanced,0.41048534711201984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,balanced,0.07956266899903615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,balanced,0.4109119971593221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,balanced,0.1120693286259969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,balanced,0.4183359940846761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,8,power_law_1.2,10.595238494873048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,balanced,0.17361066738764444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,balanced,0.4257173140843709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,balanced,0.23306133349736533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,balanced,0.4310986598332723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,balanced,0.23629866043726602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,balanced,0.4389813343683879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,balanced,0.2370026707649231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,balanced,0.461082657178243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,balanced,0.24077334006627402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,balanced,0.47702399889628094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,balanced,0.24276266495386759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,balanced,0.5207146803538004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,balanced,0.2488480011622111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,balanced,0.2534666657447815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,balanced,0.5788266658782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,balanced,0.2574826677640279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,balanced,0.06781866649786632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,balanced,0.2704319953918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,balanced,0.6651306549708048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,balanced,0.07116800049940745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.01,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,balanced,0.2760266661643982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,balanced,0.07845866680145264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,balanced,0.2874720096588135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.01,0.10117119550704956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,balanced,0.7534826596577963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,balanced,0.09816533327102661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.01,0.15450880527496338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,balanced,0.31403199831644696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,balanced,0.13375999530156454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.01,0.10188800096511841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,balanced,0.33349867661794025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,balanced,0.18905067443847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,balanced,0.2529760003089905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,balanced,0.9400959809621176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.01,0.05811840295791626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.01,0.13939839601516724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,balanced,0.381717324256897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,balanced,0.25549866755803424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.01,0.07367039918899536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.01,0.1866688013076782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,balanced,0.2576213280359904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,balanced,0.4299573500951131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.01,0.10294400453567505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.01,0.20232319831848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,balanced,0.2594933311144511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.01,0.07314559817314148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,balanced,0.2632853388786316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,balanced,1.1197813351949055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.01,0.28112640380859377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,balanced,0.5129599968592325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,balanced,0.26820266246795654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.01,0.09548159837722778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.01,0.2827712059020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,balanced,0.2741706569989522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.01,0.12963199615478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.01,0.2990272045135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,balanced,0.28069865703582764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,balanced,0.6160693168640137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.01,0.14094079732894899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.01,0.3197184085845947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,balanced,0.2956426739692688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.01,0.17150720357894897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.01,0.3255359888076782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,balanced,0.3018186688423157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,balanced,1.5243199666341145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.01,0.18097920417785646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,balanced,0.8185280164082845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.01,0.3405888080596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,balanced,0.31851200262705487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.01,0.3498176097869873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.01,0.17989120483398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,balanced,0.3575040102005005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.01,0.367903995513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.01,0.1929471969604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.01,0.37745280265808107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.01,0.20275840759277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,balanced,1.013973315556844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.01,0.2128767967224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.01,0.38679039478302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,balanced,1.919541358947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.01,0.23001599311828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,balanced,0.4111200173695882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.01,0.4298240184783936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.01,0.24006400108337403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.01,0.4874559879302979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.01,0.24855680465698243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.01,0.5605440139770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.01,0.2560447931289673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,balanced,1.434922695159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.01,0.6073472023010253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.01,0.2971776008605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.01,0.7156735897064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.01,0.32992000579833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,balanced,0.5277013381322225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.01,0.39134080410003663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.01,0.8249600410461426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,balanced,0.617845336596171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.01,0.43722238540649416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,balanced,2.320021311442057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.01,1.0484288215637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.01,0.5444672107696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,power_law_1.01,0.08358399868011475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,balanced,0.7493279774983724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.01,1.3736703872680665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.01,0.647379207611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,balanced,1.83350404103597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,power_law_1.01,0.09594879746437072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.01,1.8648448944091798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.01,0.86627197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,power_law_1.01,0.12899839878082275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,balanced,0.9628000259399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,power_law_1.01,0.09071999788284302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.01,1.0608192443847657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.01,2.0497791290283205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,power_law_1.01,0.111571204662323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,power_law_1.01,0.14302719831466676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.01,1.5438719749450684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.01,2.717715263366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,power_law_1.01,0.1563199996948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,balanced,1.2512426376342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.01,1.973574447631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,power_law_1.01,0.19913599491119385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.01,4.064153671264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,power_law_1.01,0.2042304039001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.01,2.55546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,power_law_1.01,0.2088831901550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.01,3.7566913604736327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,power_law_1.01,0.2129472017288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.01,7.983609771728515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,balanced,2.233760039011637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,power_law_1.01,0.23082239627838136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,4,power_law_1.2,0.07415680289268493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,power_law_1.01,0.24060161113739015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,balanced,1.7590346336364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.01,7.754611206054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,4,power_law_1.2,0.10092159509658813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,power_law_1.01,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,balanced,3.4128799438476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,4,power_law_1.2,0.09815679788589478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,power_law_1.01,0.2933759927749634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,power_law_1.01,0.3101696014404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,4,power_law_1.2,0.08317440152168273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,power_law_1.01,0.3283519983291626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,4,power_law_1.2,0.12341760396957398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,power_law_1.01,0.40979838371276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,4,power_law_1.2,0.17004159688949586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,balanced,2.3874826431274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,4,power_law_1.2,0.19584640264511108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,power_law_1.01,0.4728896141052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,4,power_law_1.2,0.271347188949585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,4,power_law_1.2,0.27681920528411863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,power_law_1.01,0.5514304161071777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,4,power_law_1.2,0.27565441131591795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,power_law_1.01,0.6673408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,4,power_law_1.2,0.2884223937988281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,balanced,3.3875732421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,power_law_1.01,0.9080703735351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,4,power_law_1.2,0.32851200103759765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,power_law_1.01,1.1253696441650392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,4,power_law_1.2,0.3408639907836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,balanced,3.208064079284668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,power_law_1.01,1.523532772064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,4,power_law_1.2,0.3504575967788696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,power_law_1.01,2.0097408294677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,4,power_law_1.2,0.3593728065490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,4,power_law_1.2,0.38506879806518557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,power_law_1.01,2.775507164001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,4,power_law_1.2,0.39918079376220705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,power_law_1.01,3.624665451049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,4,power_law_1.2,0.45481600761413576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,4,power_law_1.2,0.4985919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,power_law_1.01,4.8943744659423825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,4,power_law_1.2,0.584774398803711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,power_law_1.01,7.4936576843261715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,4,power_law_1.2,0.592902421951294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,4,power_law_1.2,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,balanced,3.994389216105143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,4,power_law_1.2,0.7566207885742188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,4,power_law_1.2,0.07343360185623168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,power_law_1.01,15.108242797851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,4,power_law_1.2,0.8214207649230957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,4,power_law_1.2,0.0765824019908905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,4,power_law_1.2,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,4,power_law_1.2,1.124672031402588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,balanced,6.660805384318034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,4,power_law_1.2,0.09560959935188293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,4,power_law_1.2,1.3936448097229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,4,power_law_1.2,0.1250048041343689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,4,power_law_1.2,2.0117824554443358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,4,power_law_1.2,0.13035520315170288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,4,power_law_1.2,2.2712448120117186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,4,power_law_1.2,0.16200319528579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,4,power_law_1.2,0.17203840017318725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,4,power_law_1.2,2.704806327819824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,4,power_law_1.2,0.17848960161209107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,4,power_law_1.2,4.588070297241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,4,power_law_1.2,0.19260799884796143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,4,power_law_1.2,0.19967999458312988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,4,power_law_1.2,9.475341033935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,4,power_law_1.2,0.20813438892364503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,balanced,6.243477503458659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,balanced,6.654858907063802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,4,power_law_1.2,0.22603518962860109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,4,power_law_1.2,0.23887999057769777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,4,power_law_1.2,0.2509376049041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,4,power_law_1.2,0.2642816066741943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,4,power_law_1.2,0.29655680656433103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,4,power_law_1.2,0.33692800998687744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,4,power_law_1.2,0.4090752124786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,4,power_law_1.2,0.4479487895965576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,4,power_law_1.2,0.574073600769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,4,power_law_1.2,0.6638783931732177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,4,power_law_1.2,0.9259455680847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,4,power_law_1.2,1.1313983917236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,4,power_law_1.2,1.5660096168518067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,4,power_law_1.2,2.0969152450561523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,4,power_law_1.2,2.839891242980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,4,power_law_1.2,4.4352256774902346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,4,power_law_1.2,8.172569274902344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,balanced,12.240107218424479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,balanced,0.06080533564090729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,balanced,0.06433066725730896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,balanced,0.0769706666469574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,balanced,0.11181867122650146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,4,power_law_1.2,0.08348159790039063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,balanced,0.17362133661905924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,balanced,0.29212266206741333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,4,power_law_1.2,0.09649279713630676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,balanced,0.4135520060857137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,4,power_law_1.2,0.09576320052146911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,balanced,0.41872533162434894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,balanced,0.4236746629079183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,4,power_law_1.2,0.09075199961662292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,balanced,0.4262186686197917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,4,power_law_1.2,0.11205120086669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,balanced,0.4246879816055298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,4,power_law_1.2,0.13657599687576294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,balanced,0.42926931381225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,4,power_law_1.2,0.15028480291366578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,balanced,0.4329226811726888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,4,power_law_1.2,0.1867967963218689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,balanced,0.4328213135401408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,4,power_law_1.2,0.189683198928833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,balanced,0.4430933396021525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,4,power_law_1.2,0.21300480365753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,balanced,0.4482986529668172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,balanced,0.47226134936014813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,4,power_law_1.2,0.217740797996521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,balanced,0.5091679890950521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,4,power_law_1.2,0.22810239791870118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,balanced,0.5369919935862223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,4,power_law_1.2,0.2342144012451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,balanced,0.6061280171076456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,4,power_law_1.2,0.2560767889022827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,4,power_law_1.2,0.29078400135040283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,balanced,0.7041973272959391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,4,power_law_1.2,0.30624639987945557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,4,power_law_1.2,0.3410304069519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,balanced,0.8326720396677653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,4,power_law_1.2,0.41729278564453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,balanced,0.05331199864546458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,balanced,1.0040799776713054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,4,power_law_1.2,0.4910143852233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,balanced,0.05646933118502299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,balanced,0.06491200129191081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,balanced,0.090037335952123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,balanced,0.12909866372744241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,balanced,1.345040003458659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,4,power_law_1.2,0.5694464206695556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,balanced,0.20483734210332236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,balanced,0.28277866045633954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,4,power_law_1.2,0.7085504055023193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,balanced,0.2839786609013875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,balanced,0.28730666637420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,4,power_law_1.2,0.9261119842529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,balanced,0.28887466589609784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,4,power_law_1.2,1.144486427307129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,balanced,0.29444799820582074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,balanced,1.65228271484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,balanced,0.09821866949399312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,balanced,0.3009706735610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,4,power_law_1.2,1.5643327713012696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,balanced,0.10371733705202739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,balanced,0.30611733595530194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,4,power_law_1.2,2.0976383209228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,balanced,0.3139839967091878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,balanced,0.1127786636352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,balanced,0.1318933367729187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,balanced,0.3272160092989604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,4,power_law_1.2,3.1190847396850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.01,0.05925120115280151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.01,0.06106240153312683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,balanced,0.17172267039616904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,balanced,0.33503464857737225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.01,0.0616703987121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,4,power_law_1.2,3.9943103790283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.01,0.07388160228729249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,balanced,0.24484266837437949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,balanced,2.360362688700358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.01,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,balanced,0.35761066277821857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,balanced,0.32151466608047485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.01,0.10436480045318604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.01,0.07794560194015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,4,power_law_1.2,5.464454269409179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,balanced,0.38809065024058026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,balanced,0.3272426724433899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.01,0.10252799987792968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.01,0.0896127998828888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,balanced,0.33168532450993854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,balanced,0.42056000232696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.01,0.1397696018218994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,4,power_law_1.2,7.453542327880859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.01,0.14268800020217895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,balanced,0.3367626667022705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.01,0.1579327940940857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,balanced,0.4919039805730184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.01,0.18583680391311647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,balanced,0.3447680075963338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.01,0.19969919919967652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,balanced,0.3546559810638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.01,0.2024319887161255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.01,0.2128767967224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,4,power_law_1.2,16.934719848632813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,balanced,0.5587466557820638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,balanced,0.36298668384552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.01,0.21590399742126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.01,0.2803584098815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,balanced,2.911168098449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,balanced,0.37628265221913654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.01,0.2266239881515503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.01,0.2960319995880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,balanced,0.39625600973765057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,balanced,0.6784586906433105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.01,0.23795840740203858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.01,0.30449280738830564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,balanced,0.40930132071177167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.01,0.25163519382476807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,balanced,0.4561706781387329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.01,0.3270143985748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.01,0.26703999042510984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,balanced,0.8555306593577067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.01,0.34298880100250245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,balanced,0.524346669514974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.01,0.28664960861206057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.01,0.34936959743499757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.01,0.31000959873199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.01,0.3816832065582275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.01,0.3119040012359619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,balanced,1.175114631652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.01,0.3912575960159302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.01,0.3682368040084839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.01,0.41185917854309084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,balanced,3.412869453430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,balanced,0.6220586697260538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.01,0.4098048210144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.01,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.01,0.5072768211364747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.01,0.4924160003662109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.01,0.5511104106903076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,balanced,1.5056053797403972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.01,0.5416959762573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.01,0.6483456134796143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.01,0.6971136093139648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.01,0.6962624073028565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.01,0.8380031585693359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,balanced,0.8179946740468343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,power_law_1.01,0.09671040177345276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.01,0.887980842590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.01,1.1446784019470215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.01,1.079526424407959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,power_law_1.01,0.10705280303955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,balanced,0.979744036992391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.01,1.5236991882324218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.01,1.3812735557556153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,balanced,2.179434617360433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,2,power_law_1.2,0.06179839968681335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,power_law_1.01,0.1261247992515564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.01,2.1631744384765623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.01,1.6760383605957032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,power_law_1.01,0.12259839773178101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,2,power_law_1.2,0.07367039918899536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,balanced,1.2082666556040447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.01,2.3113536834716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.01,2.760006332397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,power_law_1.01,0.15022720098495485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,2,power_law_1.2,0.07418879866600037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.01,2.904844856262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.01,3.2918846130371096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,power_law_1.01,0.1859392046928406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,2,power_law_1.2,0.09167360067367554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,balanced,1.6092267036437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.01,3.5680831909179687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,balanced,5.373226801554362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,power_law_1.01,0.20608000755310057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,2,power_law_1.2,0.12966400384902954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.01,5.164441680908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.01,5.582483291625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,power_law_1.01,0.23631999492645264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,2,power_law_1.2,0.16687999963760375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,balanced,2.5760159492492676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,power_law_1.01,0.25701758861541746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,balanced,2.1219894091288247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,2,power_law_1.2,0.19459840059280395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.01,11.37306900024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.01,11.706893157958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,power_law_1.01,0.2665600061416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,2,power_law_1.2,0.26968960762023925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,power_law_1.01,0.28039040565490725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,2,power_law_1.2,0.2887808084487915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,power_law_1.01,0.30141439437866213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,2,power_law_1.2,0.2959552049636841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,balanced,2.9877281188964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,power_law_1.01,0.31724159717559813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,2,power_law_1.2,0.30877439975738524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,power_law_1.01,0.3482048034667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,2,power_law_1.2,0.33902080059051515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,power_law_1.01,0.3691456079483032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,2,power_law_1.2,0.3457855939865112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,balanced,3.205162684122721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,power_law_1.01,0.40346240997314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,2,power_law_1.2,0.3797760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,balanced,4.064256032307942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,2,power_law_1.2,0.38708479404449464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,power_law_1.01,0.461740779876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,2,power_law_1.2,0.42435197830200194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,power_law_1.01,0.5809599876403808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,2,power_law_1.2,0.4349952220916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,2,power_law_1.2,0.4986432075500488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,power_law_1.01,0.6744256019592285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,2,power_law_1.2,0.5658880233764648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,2,power_law_1.2,0.6963583946228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,power_law_1.01,0.8392704010009766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,2,power_law_1.2,0.7419648170471191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,balanced,5.542853037516276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,2,power_law_1.2,0.9583680152893066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,power_law_1.01,1.046342372894287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,2,power_law_1.2,1.0774399757385253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,power_law_1.01,1.35863037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,2,power_law_1.2,1.4431167602539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,power_law_1.01,1.7299455642700194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,balanced,4.914880116780599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,2,power_law_1.2,1.7523008346557618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,balanced,10.73904037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,power_law_1.01,2.365817642211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,2,power_law_1.2,2.5267072677612306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,power_law_1.01,3.1127296447753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,2,power_law_1.2,2.986611175537109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,power_law_1.01,4.38485107421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,balanced,6.898405075073242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,2,power_law_1.2,3.9272705078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,power_law_1.01,5.834073638916015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,2,power_law_1.2,6.16798095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,power_law_1.01,7.4589378356933596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,power_law_1.01,11.48949737548828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,2,power_law_1.2,12.46258544921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,power_law_1.01,23.191853332519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,balanced,10.764383951822916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,2,power_law_1.2,0.05936639904975891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,2,power_law_1.2,0.06197119951248169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,balanced,10.153984069824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,2,power_law_1.2,0.06492800116539002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,2,power_law_1.2,0.07799680233001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,2,power_law_1.2,0.10149120092391968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,2,power_law_1.2,0.12896000146865844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,2,power_law_1.2,0.14444799423217775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,2,power_law_1.2,0.1865023970603943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,2,power_law_1.2,0.20156800746917725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,2,power_law_1.2,0.20592639446258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,2,power_law_1.2,0.2172032117843628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,2,power_law_1.2,0.23939199447631837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,2,power_law_1.2,0.245849609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,2,power_law_1.2,0.26737279891967775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,2,power_law_1.2,0.29015679359436036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,2,power_law_1.2,0.3096447944641113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,2,power_law_1.2,0.31573760509490967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,balanced,21.1070556640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,2,power_law_1.2,0.3769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,2,power_law_1.2,0.4148287773132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,2,power_law_1.2,0.5224703788757324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,2,power_law_1.2,0.5811327934265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,2,power_law_1.2,0.7456319808959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,2,power_law_1.2,0.9035072326660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,2,power_law_1.2,1.1960895538330079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,balanced,0.06684266527493794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,2,power_law_1.2,1.595244789123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,balanced,0.08577600121498108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,2,power_law_1.2,2.2550912857055665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,balanced,0.09567999839782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,balanced,0.1327946682771047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,2,power_law_1.2,2.9083200454711915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,2,power_law_1.2,0.09649919867515563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,balanced,0.20383999745051065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,balanced,0.3370506763458252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,2,power_law_1.2,0.10693119764328003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,2,power_law_1.2,3.388889694213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,balanced,0.476800004641215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,2,power_law_1.2,0.1159168004989624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,balanced,0.4886666536331177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,2,power_law_1.2,0.12383359670639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,2,power_law_1.2,5.487225723266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,balanced,0.49453334013621014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,2,power_law_1.2,0.14692480564117433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,balanced,0.4970719814300537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,2,power_law_1.2,0.17277439832687377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,balanced,0.4927786588668823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,2,power_law_1.2,11.562662506103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,2,power_law_1.2,0.19544320106506347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,balanced,0.503104011217753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,2,power_law_1.2,0.23383679389953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,balanced,0.5088586807250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,2,power_law_1.2,0.2569535970687866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,balanced,0.5183733304341634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,2,power_law_1.2,0.27007360458374025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,balanced,0.5314986705780029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,2,power_law_1.2,0.2859711885452271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,balanced,0.538271983464559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,2,power_law_1.2,0.3032383918762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,balanced,0.5611413319905599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,2,power_law_1.2,0.31526401042938235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,balanced,0.6221173206965128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,2,power_law_1.2,0.34565119743347167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,balanced,0.6712533632914225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,2,power_law_1.2,0.3731391906738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,2,power_law_1.2,0.4023104190826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,balanced,0.7878506978352865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,2,power_law_1.2,0.4740096092224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,balanced,0.0617386649052302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,2,power_law_1.2,0.5890431880950928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,balanced,0.9656960169474283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,balanced,0.07044266661008199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,balanced,0.08167999982833862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,balanced,0.11614400148391724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,balanced,0.1725333333015442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,balanced,1.199893315633138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,2,power_law_1.2,0.6856319904327393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,balanced,0.28649600346883136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,balanced,0.39738667011260986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,balanced,0.4012853304545085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,balanced,1.511642615000407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,balanced,0.3998719851175944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,2,power_law_1.2,0.8425600051879882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,balanced,0.40572798252105713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,2,power_law_1.2,1.0516223907470703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,balanced,0.4118560155232747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,2,power_law_1.2,1.427667236328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,balanced,0.41701332728068036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,balanced,2.1332799593607583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,2,power_law_1.2,1.7966079711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,balanced,0.4223039944966634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,balanced,0.4336800177892049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,2,power_law_1.2,2.495251274108887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,balanced,0.44730134805043537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,2,power_law_1.2,3.0959423065185545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,balanced,0.4558986822764079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,balanced,2.7166932423909507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,2,power_law_1.2,4.598809432983399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,balanced,0.48479998111724854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,balanced,0.5273386637369791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,2,power_law_1.2,5.873267364501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,balanced,0.6057440042495728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.06119679808616638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,2,power_law_1.2,7.806969451904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,balanced,0.7131466865539551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.0926912009716034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,balanced,0.8374293645222982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,2,power_law_1.2,11.767929840087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,balanced,3.899418512980143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.11145600080490112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.15897599458694459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,balanced,1.043610652287801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.2128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,2,power_law_1.2,24.414944458007813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.25299839973449706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.32940800189971925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,balanced,1.3574132919311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.34920320510864256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.0555840015411377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.3595968008041382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.3791232109069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,balanced,4.749706586201985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.06663039922714234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,balanced,1.898848056793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.40506877899169924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.07834879755973816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.41646718978881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.09609599709510804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.44084482192993163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.13953919410705568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.463699197769165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,balanced,2.4952905972798667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.19040640592575073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.47786879539489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.5258624076843261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.21388800144195558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.6169727802276611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.27445120811462403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,balanced,5.874538421630859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.01,3.024281692504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.2841408014297485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.01,3.647129440307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.9704447746276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.29112958908081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,balanced,3.638186772664388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.01,1.2284159660339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.31067519187927245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.01,1.508364772796631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.33752319812774656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.01,2.0721408843994142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.3504256010055542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.01,2.533119964599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.3764415979385376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.01,3.6396224975585936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,balanced,4.3192853927612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.40869760513305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.01,4.64384651184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.4356351852416992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.01,5.649862289428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,balanced,8.651088078816732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.01,8.764115142822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.44664959907531737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.01,0.5419007778167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.01,19.340786743164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,0.6182464122772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,0.7735295772552491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,balanced,5.397829055786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,0.8333696365356446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,1.062169647216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,1.3075776100158691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,1.8155071258544921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,2.3516416549682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,3.428793716430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,4.293817520141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.01,5.281491088867187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,balanced,8.458255767822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.0611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.08145920038223267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.01,8.186483001708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.08513919711112976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.10988160371780395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.1455296039581299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.01,18.38970184326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.19864319562911986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.22894079685211183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,balanced,18.702592213948567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.31400959491729735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.3370687961578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.35086081027984617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.3637120008468628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.3816447973251343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.4041152000427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.4366911888122559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.4633791923522949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.4785600185394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.5376319885253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.6405504226684571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,1,power_law_1.2,3.0609535217285155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,1,power_law_1.2,3.941350555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.9992639541625976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,1,power_law_1.2,1.2764991760253905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,1,power_law_1.2,1.580198383331299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,1,power_law_1.2,2.1168256759643556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,1,power_law_1.2,2.596518325805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,balanced,17.667994181315105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,1,power_law_1.2,3.716633605957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.055430400371551516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,1,power_law_1.2,4.618399810791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.06666240096092224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,1,power_law_1.2,5.641024017333985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.07139840126037597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,1,power_law_1.2,8.787142181396485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.09475200176239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.1309823989868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,1,power_law_1.2,18.914341735839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.16872960329055786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.20085759162902833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.25656321048736574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.27289600372314454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.28270080089569094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.303219199180603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.3339008092880249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.3572544097900391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.37465600967407225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.4115903854370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.4295040130615234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.449567985534668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,balanced,0.058373332023620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,1,power_law_1.2,0.5528192043304443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,balanced,0.05966933568318685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,0.6265920162200928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,balanced,0.05950400233268738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,0.7804992198944092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,balanced,0.054042667150497437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,balanced,0.06727999945481618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,0.875545597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,balanced,0.08039466540018718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,1.1039423942565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,balanced,0.08869866530100505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,1.3746111869812012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,balanced,0.090421328941981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,1.8859519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,balanced,0.12404800454775493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,balanced,0.12497066458066304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,2.4220224380493165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,power_law_1.01,0.10550400018692016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,balanced,0.12270399928092957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,balanced,0.1204853355884552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,3.516755294799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,power_law_1.01,0.09202560186386108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,balanced,0.12215999762217204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,power_law_1.01,0.0755840003490448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,balanced,0.12131733695665996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,4.345651245117187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,power_law_1.01,0.058182400465011594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,balanced,0.12031466762224834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,power_law_1.01,0.07066879868507385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,balanced,0.12157332897186279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,1,power_law_1.2,5.331206512451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,power_law_1.01,0.07929599881172181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,balanced,0.12155733505884807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,power_law_1.01,0.08155519962310791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,balanced,0.12250133355458577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,1,power_law_1.2,8.185049438476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,power_law_1.01,0.08367999792098998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,balanced,0.12545067071914673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,power_law_1.01,0.12382719516754151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,balanced,0.1304373343785604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,power_law_1.01,0.12584960460662842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,1,power_law_1.2,18.25239715576172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,power_law_1.01,0.12416640520095826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,balanced,0.13901333014170328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,power_law_1.01,0.11998080015182495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,32,power_law_1.2,0.10490880012512208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,balanced,0.15507200360298157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,power_law_1.01,0.12006399631500245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,balanced,0.04826133449872335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,power_law_1.01,0.11623680591583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,32,power_law_1.2,0.09091839790344239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,balanced,0.050053333242734276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,balanced,0.175327996412913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,power_law_1.01,0.12595200538635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,32,power_law_1.2,0.061740797758102414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,balanced,0.049226666490236916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,power_law_1.01,0.12032639980316162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,32,power_law_1.2,0.06046079993247986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,power_law_1.01,0.12298879623413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,balanced,0.04797866443792979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,balanced,0.2844746708869934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,32,power_law_1.2,0.07247359752655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,power_law_1.01,0.1292415976524353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,balanced,0.0518453319867452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,power_law_1.01,0.17304320335388185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,32,power_law_1.2,0.07868160009384155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,balanced,0.05942399799823761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,balanced,0.322869340578715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,power_law_1.01,0.1945024013519287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,32,power_law_1.2,0.08451200127601624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,balanced,0.0650186687707901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,power_law_1.01,0.22019200325012206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,32,power_law_1.2,0.08181120157241821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,balanced,0.06578666468461354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,power_law_1.01,0.30305280685424807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,balanced,0.07776000102361043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,32,power_law_1.2,0.1146239995956421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,power_law_1.01,0.34362239837646485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,balanced,0.4708426793416341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,balanced,0.08458667000134786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,32,power_law_1.2,0.12124799489974976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,power_law_1.01,0.5222847938537598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,balanced,0.07593599955240886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,32,power_law_1.2,0.12013440132141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,power_law_1.01,0.6364031791687011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,balanced,0.1257973313331604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,32,power_law_1.2,0.12269439697265624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,power_law_1.01,0.9224063873291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,balanced,0.12457066774368286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,balanced,0.6175200144449869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,32,power_law_1.2,0.12585599422454835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,power_law_1.01,1.316908836364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,balanced,0.12321066856384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,32,power_law_1.2,0.13055360317230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,power_law_1.01,1.4498047828674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,balanced,0.121888001759847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,32,power_law_1.2,0.12861440181732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,power_law_1.01,2.4223167419433596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,balanced,0.12581866979599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,32,power_law_1.2,0.12162560224533081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,power_law_1.01,5.035295867919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,balanced,0.12461333473523457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,32,power_law_1.2,0.1287168025970459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,balanced,0.12588799993197122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,balanced,0.7626773516337076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,32,power_law_1.2,0.16371840238571167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,balanced,0.1286186675230662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,32,power_law_1.2,0.18916480541229247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,balanced,0.13553067048390707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,power_law_1.01,0.07166079878807068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,32,power_law_1.2,0.22532479763031005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,balanced,0.14342400431632996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,power_law_1.01,0.09125120043754578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,32,power_law_1.2,0.2696448087692261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,balanced,0.15961066881815592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,power_law_1.01,0.06785920262336731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,32,power_law_1.2,0.38525440692901614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,power_law_1.01,0.05738880038261414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,32,power_law_1.2,0.42543997764587405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,balanced,0.17546667655309042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,balanced,1.2005813121795654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,power_law_1.01,0.05514879822731018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,32,power_law_1.2,0.6428287982940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,balanced,0.27776533365249634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,power_law_1.01,0.05554559826850891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,32,power_law_1.2,0.835807991027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,16,power_law_1.2,0.0719871997833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,32,power_law_1.2,1.4182016372680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,power_law_1.01,0.06439679861068726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,16,power_law_1.2,0.07694720029830933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,32,power_law_1.2,2.1083328247070314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,balanced,0.31838399171829224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,16,power_law_1.2,0.061964797973632815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,power_law_1.01,0.07770879864692688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,32,power_law_1.2,2.486195182800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,16,power_law_1.2,0.0576960027217865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,power_law_1.01,0.08082559704780579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,16,power_law_1.2,0.0541055977344513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,32,power_law_1.2,3.8278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,power_law_1.01,0.0735360026359558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,balanced,0.4628213246663411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,16,power_law_1.2,0.055232000350952146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,power_law_1.01,0.12006399631500245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,16,power_law_1.2,0.06227200031280518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,power_law_1.2,8.06039047241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,power_law_1.01,0.11609599590301514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,16,power_law_1.2,0.06342399716377259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,16,power_law_1.2,0.07902079820632935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,power_law_1.01,0.12244479656219483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,16,power_law_1.2,0.07994239926338195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,power_law_1.01,0.1268224000930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,balanced,0.6038133303324381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,16,power_law_1.2,0.07861120104789734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,power_law_1.01,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,32,balanced,2.364960034688314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,16,power_law_1.2,0.1254591941833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,power_law_1.01,0.12735359668731688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,16,power_law_1.2,0.12498559951782226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,16,power_law_1.2,0.12462719678878784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,power_law_1.01,0.12989439964294433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,16,power_law_1.2,0.12463359832763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,balanced,0.7473333676656088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,power_law_1.01,0.14283519983291626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,16,power_law_1.2,0.13093119859695435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,power_law_1.01,0.1826815962791443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,16,power_law_1.2,0.12955520153045655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,16,power_law_1.2,0.13826559782028197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,power_law_1.01,0.19459199905395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,16,power_law_1.2,0.15886080265045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,power_law_1.01,0.23084158897399903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,16,power_law_1.2,0.1909119963645935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,16,power_law_1.2,0.2285759925842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,power_law_1.01,0.32226560115814207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,16,power_law_1.2,0.2882688045501709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,power_law_1.01,0.39740800857543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,balanced,0.03389333436886469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,16,power_law_1.2,0.34021759033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,balanced,1.1751360098520915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,balanced,0.03579200059175491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,power_law_1.01,0.5468416213989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,16,power_law_1.2,0.5417856216430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,balanced,0.037418665985266365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,16,power_law_1.2,0.6438208103179932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,power_law_1.01,0.7692416191101075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,balanced,0.04142399877309799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,16,power_law_1.2,1.0887167930603028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,power_law_1.01,1.070195198059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,balanced,0.052101333936055504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,16,power_law_1.2,1.3630847930908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,balanced,0.060032000144322716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,power_law_1.2,1.5849087715148926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,16,power_law_1.01,1.3604479789733888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,balanced,0.06080000102519989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,power_law_1.2,2.547200012207031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,balanced,0.0610453337430954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,16,power_law_1.01,1.8888704299926757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,balanced,0.062165334820747375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,power_law_1.2,5.262815856933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,power_law_1.01,4.056563186645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,balanced,0.06310933331648509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,balanced,0.07555200159549713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,balanced,0.07507200042406718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,balanced,0.07544533411661784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,16,balanced,2.3140907287597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,balanced,0.12029866377512614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,balanced,0.12082667152086894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,balanced,0.11920000116030376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,power_law_1.01,0.03531520068645477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,balanced,0.1216266651948293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,power_law_1.01,0.04302720129489899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,balanced,0.12483732899030049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,power_law_1.01,0.04190720021724701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,power_law_1.01,0.04647040069103241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,balanced,0.13360533118247986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,power_law_1.01,0.052832001447677614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,balanced,0.14258133371671042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,power_law_1.01,0.05457280278205871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,balanced,0.16059733430544534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,power_law_1.01,0.05767040252685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,power_law_1.01,0.05856639742851257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,balanced,0.17971199750900269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,power_law_1.01,0.06071680188179016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,power_law_1.01,0.06097279787063599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,balanced,0.2799893418947856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,power_law_1.01,0.061887997388839724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,8,power_law_1.2,0.03597440123558045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,power_law_1.01,0.07552000284194946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,balanced,0.3186560074488322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,power_law_1.01,0.07297919988632202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,8,power_law_1.2,0.04394879937171936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,8,power_law_1.2,0.041017600893974306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,power_law_1.01,0.07519999742507935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,8,power_law_1.2,0.05008000135421753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,power_law_1.01,0.11799039840698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,balanced,0.4635946750640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,8,power_law_1.2,0.05114240050315857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,power_law_1.01,0.12094719409942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,8,power_law_1.2,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,power_law_1.01,0.1232192039489746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,8,power_law_1.2,0.05767679810523987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,8,power_law_1.2,0.05860480070114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,power_law_1.01,0.12548480033874512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,8,power_law_1.2,0.06149759888648987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,balanced,0.6014933188756307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,power_law_1.01,0.13829760551452636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,8,power_law_1.2,0.06258559823036194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,power_law_1.01,0.1549183964729309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,8,power_law_1.2,0.062003201246261595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,8,power_law_1.2,0.07504000067710877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,power_law_1.01,0.18273279666900635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,8,power_law_1.2,0.08011519908905029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,power_law_1.01,0.22471680641174316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,8,power_law_1.2,0.07761279940605163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,power_law_1.01,0.2688512086868286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,balanced,0.7489066918691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,8,power_law_1.2,0.11580799818038941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,power_law_1.01,0.37128961086273193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,8,power_law_1.2,0.12632960081100464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,8,power_law_1.2,0.13075200319290162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,power_law_1.01,0.45729918479919435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,8,power_law_1.2,0.1398975968360901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,power_law_1.01,0.6377600193023681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,8,power_law_1.2,0.1508288025856018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,power_law_1.01,0.8379072189331055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,8,power_law_1.2,0.16062079668045043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,power_law_1.01,1.0378368377685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,8,power_law_1.2,0.20208640098571778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,power_law_1.01,1.5414976119995116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,8,power_law_1.2,0.24110078811645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,balanced,1.1689279874165852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,8,power_law_1.2,0.29985918998718264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,power_law_1.01,3.1556159973144533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,balanced,0.029824001093705494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,8,power_law_1.2,0.3909440040588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,power_law_1.01,0.031251201033592226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,8,power_law_1.2,0.5293439865112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,balanced,0.033173332611719765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,8,power_law_1.2,0.801689624786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,balanced,0.03385599950949351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,power_law_1.01,0.03537920117378235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,8,power_law_1.2,1.0725824356079101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,balanced,0.03951466580231985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,power_law_1.01,0.03377279937267304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,8,power_law_1.2,1.3066880226135253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,balanced,0.04656533400217692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,power_law_1.01,0.04140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,balanced,0.06237866481145223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,8,power_law_1.2,1.6528511047363281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,balanced,0.06085333228111267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,power_law_1.01,0.047007998824119566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,power_law_1.2,4.174655914306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,balanced,0.06085866689682007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,power_law_1.01,0.05200639963150024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,balanced,0.060789331793785095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,power_law_1.01,0.05559679865837097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,balanced,0.0609440008799235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,power_law_1.01,0.057011198997497556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,balanced,0.061759998401006065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,balanced,0.0651093324025472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,power_law_1.01,0.05751680135726929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,8,balanced,2.3011627197265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,balanced,0.06555200119813283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,power_law_1.01,0.0580672025680542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,balanced,0.06629866858323415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,power_law_1.01,0.05856000185012818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,balanced,0.07643733421961467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,power_law_1.01,0.0636672019958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,balanced,0.0790826678276062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,power_law_1.01,0.06388480067253113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,balanced,0.07949866851170857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,power_law_1.01,0.06428160071372986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,balanced,0.13075733184814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,power_law_1.01,0.07527679800987244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,balanced,0.13422933220863342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,power_law_1.01,0.07847679853439331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,balanced,0.1434346636136373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,power_law_1.01,0.0812928020954132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,balanced,0.028437333802382152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,4,power_law_1.2,0.03123840093612671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,balanced,0.15275200208028158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,power_law_1.01,0.1357759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,balanced,0.03206400076548258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,4,power_law_1.2,0.03509120047092438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,balanced,0.03297599901755651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,balanced,0.17260799805323282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,power_law_1.01,0.14154239892959594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,4,power_law_1.2,0.03430399894714355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,balanced,0.05362666646639506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,power_law_1.01,0.1561792016029358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,4,power_law_1.2,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,balanced,0.19448000192642212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,4,power_law_1.2,0.04619520008563995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,power_law_1.01,0.1820032000541687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,balanced,0.07332799832026164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,4,power_law_1.2,0.051801598072052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,power_law_1.01,0.2255295991897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,balanced,0.07171200215816498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,balanced,0.29874134063720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,power_law_1.01,0.028812798857688903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,balanced,0.07170133292675018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,4,power_law_1.2,0.05451520085334778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,power_law_1.01,0.2673408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,balanced,0.0668693333864212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,power_law_1.01,0.03365119993686676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,4,power_law_1.2,0.05742719769477844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,power_law_1.01,0.36274559497833253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,balanced,0.34012266000111896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,balanced,0.06795200208822887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,4,power_law_1.2,0.05699840188026428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,power_law_1.01,0.03403519988059998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,power_law_1.01,0.4430272102355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,balanced,0.07427733143170674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,4,power_law_1.2,0.0584447979927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,power_law_1.01,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,balanced,0.07449066638946533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,power_law_1.01,0.6355199813842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,balanced,0.07459733386834462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,power_law_1.01,0.047417598962783816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,balanced,0.5001279910405477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,4,power_law_1.2,0.058950400352478026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,balanced,0.08210133512814839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,power_law_1.01,0.798963212966919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,balanced,0.08355733752250671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,4,power_law_1.2,0.06424319744110107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,power_law_1.01,0.05345919728279114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,power_law_1.01,1.0069503784179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,balanced,0.08582933743794759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,4,power_law_1.2,0.06330239772796631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,power_law_1.01,0.06327040195465088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,balanced,0.09634666641553243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,power_law_1.01,1.5302720069885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,4,power_law_1.2,0.06596480011940002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,power_law_1.01,0.06399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,balanced,0.10061333576838176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,balanced,0.6462399959564209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,4,power_law_1.2,0.07805439829826355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,power_law_1.01,0.06152960062026978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,power_law_1.01,3.114828872680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,balanced,0.1737920045852661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,4,power_law_1.2,0.08141440153121948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,power_law_1.01,0.06111999750137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,balanced,0.1851200064023336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,4,power_law_1.2,0.08488320112228394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,power_law_1.01,0.06302080154418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,balanced,0.21011734008789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,4,power_law_1.2,0.14369280338287355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,power_law_1.01,0.07157120108604431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,balanced,0.7984106540679932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,balanced,0.2357920010884603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,4,power_law_1.2,0.1479423999786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,power_law_1.01,0.07288320064544677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,4,power_law_1.2,0.16900479793548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,power_law_1.01,0.07407360076904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,balanced,0.389359990755717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,4,power_law_1.2,0.19812480211257935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,power_law_1.01,0.08131840229034423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,4,power_law_1.2,0.23568639755249024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,power_law_1.01,0.08320639729499817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,balanced,0.4381759961446126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,4,power_law_1.2,0.29651200771331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,power_law_1.01,0.08773760199546814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,4,power_law_1.2,0.4054399967193604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,balanced,1.2528159618377686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,power_law_1.01,0.11357439756393432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,balanced,0.6361653407414755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,4,power_law_1.2,0.47825279235839846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,power_law_1.01,0.1223423957824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,4,power_law_1.2,0.7715392112731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,power_law_1.01,0.20824320316314698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,4,power_law_1.2,0.9711872100830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,power_law_1.01,0.2284480094909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,balanced,0.8307200272878011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,4,power_law_1.2,1.1684351921081544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,power_law_1.01,0.27381761074066163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,4,power_law_1.2,1.698784065246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,power_law_1.01,0.3356287956237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,power_law_1.01,0.442303991317749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,power_law_1.2,3.536185455322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,power_law_1.01,0.5569600105285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,balanced,1.028106689453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,power_law_1.01,0.7686016082763671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,power_law_1.01,1.0225088119506835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,power_law_1.01,1.1811391830444335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,4,balanced,2.4419679641723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,power_law_1.01,1.9601280212402343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,2,power_law_1.2,0.029075199365615846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,2,power_law_1.2,0.03299199938774109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,power_law_1.01,3.4795711517333983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,balanced,1.6188160578409831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,2,power_law_1.2,0.03170560002326965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,2,power_law_1.2,0.041606399416923526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,2,power_law_1.2,0.04496639966964722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,2,power_law_1.2,0.04993920028209686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,2,power_law_1.2,0.0621504008769989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,balanced,0.025461333493391674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,2,power_law_1.2,0.06506879925727845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,balanced,0.02716800073782603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,2,power_law_1.2,0.060115200281143186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,balanced,0.029440000653266907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,2,power_law_1.2,0.06173440217971802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,2,power_law_1.2,0.06298879981040954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,balanced,0.04839999973773956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,2,power_law_1.2,0.07253119945526124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,2,power_law_1.2,0.07299839854240417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,balanced,0.07419200241565704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,2,power_law_1.2,0.07592319846153259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,power_law_1.01,0.02452480047941208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,2,power_law_1.2,0.08314239978790283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,balanced,0.07506133119265239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,balanced,3.169994672139486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,2,power_law_1.2,0.08476160168647766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,power_law_1.01,0.026348799467086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,2,power_law_1.2,0.08916479945182801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,power_law_1.01,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,balanced,0.07394133508205414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,power_law_1.01,0.03568640053272247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,2,power_law_1.2,0.12063360214233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,power_law_1.01,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,2,power_law_1.2,0.1276927947998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,balanced,0.07486933469772339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,power_law_1.01,0.048256000876426695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,balanced,0.07267199953397115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,2,power_law_1.2,0.21985280513763428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,power_law_1.01,0.060057598352432254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,balanced,0.07302933434645335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,2,power_law_1.2,0.23748478889465333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,power_law_1.01,0.061638402938842776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,balanced,0.06890133519967397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,2,power_law_1.2,0.3039423942565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,power_law_1.01,0.060249602794647215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,balanced,0.06937600175539653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,2,power_law_1.2,0.34710400104522704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,power_law_1.01,0.06320000290870667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,balanced,0.07114666700363159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,2,power_law_1.2,0.495084810256958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,power_law_1.01,0.06595839858055115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,balanced,0.07726933558781941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,power_law_1.01,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,2,power_law_1.2,0.5554240226745606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,balanced,0.07928533355395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,power_law_1.01,0.06530560255050659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,balanced,0.08313600222269694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,2,power_law_1.2,0.7658751964569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,balanced,0.09643733501434326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,2,power_law_1.2,1.0076160430908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,power_law_1.01,0.07502080202102661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,2,power_law_1.2,1.2636992454528808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,balanced,0.10327999790509541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,power_law_1.01,0.0777728021144867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,2,power_law_1.2,1.8823936462402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,balanced,0.12896533807118735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,power_law_1.01,0.08223360180854797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,2,power_law_1.2,3.7281024932861326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,power_law_1.01,0.0961408019065857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,balanced,0.1432799994945526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,power_law_1.01,0.10270719528198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,balanced,0.2523840069770813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,power_law_1.01,0.12384639978408814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,power_law_1.01,0.15389440059661866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,balanced,0.28147733211517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,power_law_1.01,0.1846783995628357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,power_law_1.01,0.31192960739135744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,balanced,0.46882665157318115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,power_law_1.01,0.38259201049804686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,power_law_1.01,0.5014272212982178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,balanced,0.531823992729187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,power_law_1.01,0.6223296165466309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,power_law_1.01,0.8539775848388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,1,power_law_1.2,0.02460159957408905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,balanced,0.7733226617177328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,power_law_1.01,1.0883584022521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,1,power_law_1.2,0.026374399662017822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,1,power_law_1.2,0.027296000719070436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,power_law_1.01,1.3222847938537599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,1,power_law_1.2,0.03431040048599243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,power_law_1.01,2.0095359802246096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,1,power_law_1.2,0.040780800580978396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,1,power_law_1.2,0.04611839950084686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,balanced,1.0082879861195881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,power_law_1.01,3.8824127197265623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,1,power_law_1.2,0.06049280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,1,power_law_1.2,0.06208639740943909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,1,power_law_1.2,0.06096640229225159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,1,power_law_1.2,0.06414080262184144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,1,power_law_1.2,0.06669440269470214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,1,power_law_1.2,0.06353279948234558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,balanced,1.2439839839935303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,1,power_law_1.2,0.06532480120658875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,1,power_law_1.2,0.07541120052337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,1,power_law_1.2,0.07887359857559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,1,power_law_1.2,0.08280959725379944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,1,power_law_1.2,0.0964031994342804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,1,power_law_1.2,0.10474879741668701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,1,power_law_1.2,0.1257599949836731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,balanced,1.9445172945658367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,1,power_law_1.2,0.15991679430007935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,1,power_law_1.2,0.18874239921569824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,1,power_law_1.2,0.3271039962768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,1,power_law_1.2,0.39670400619506835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,1,power_law_1.2,0.5127615928649902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,1,power_law_1.2,0.6334784030914307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,1,power_law_1.2,0.8623040199279786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,1,power_law_1.2,1.0926079750061035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,balanced,0.05130666494369507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,power_law_1.2,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,1,32,power_law_1.01,0.05072640180587769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,1,power_law_1.2,1.3272768020629884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,1,power_law_1.2,2.0219776153564455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,power_law_1.2,3.888915252685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,balanced,0.05258666475613912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,power_law_1.01,0.051744002103805545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,1,32,power_law_1.2,0.05130879878997803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,balanced,0.05287466446558634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,power_law_1.2,0.05148800015449524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,1,32,power_law_1.01,0.051481598615646364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,1,balanced,3.8214025497436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,balanced,0.05958400170008341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,power_law_1.01,0.05512319803237915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,1,32,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,balanced,0.04515199859937032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,power_law_1.01,0.060083198547363284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,power_law_1.2,0.060102397203445436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,balanced,0.046613335609436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,1,32,balanced,0.062405332922935486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,balanced,0.04619733492533366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,balanced,0.0476693312327067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,balanced,0.05156800150871277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,power_law_1.01,0.06844159960746765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,power_law_1.2,0.06833919882774353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,1,32,balanced,0.07036266724268596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,balanced,0.05611200133959452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,balanced,0.06252266466617584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,balanced,0.06081599990526835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,balanced,0.06756799916426341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,balanced,0.06764266888300578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,power_law_1.01,0.07070720195770264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,power_law_1.2,0.07061759829521179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,1,32,balanced,0.07226666808128357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,balanced,0.06797866523265839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,power_law_1.01,0.07112320065498352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,balanced,0.06720000008742015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,power_law_1.2,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,power_law_1.01,0.05175039768218994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,balanced,0.06821333368619283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,1,32,balanced,0.07181866466999054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,balanced,0.06855999926726024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,balanced,0.06920533378918965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,power_law_1.01,0.04578559994697571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,balanced,0.07057600220044453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,power_law_1.01,0.08354560136795045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,power_law_1.2,0.08520960211753845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,power_law_1.01,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,balanced,0.07136000196139018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,balanced,0.07456533114115398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,power_law_1.01,0.08363519906997681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,power_law_1.01,0.05233280062675476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,power_law_1.2,0.08387200236320495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,1,32,balanced,0.08368000388145447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,balanced,0.07747733096281688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,power_law_1.01,0.08391039967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,power_law_1.01,0.05811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,power_law_1.2,0.08441600203514099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,balanced,0.08828799923261006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,1,32,balanced,0.08406933148701985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,power_law_1.01,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,power_law_1.01,0.06095359921455383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,balanced,0.09638399879137675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,power_law_1.2,0.08506240248680115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,power_law_1.01,0.08504319787025452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,power_law_1.01,0.06874240040779114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,1,32,balanced,0.08463999629020691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,power_law_1.2,0.08604159951210022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,balanced,0.1536906659603119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,power_law_1.01,0.0861952006816864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,power_law_1.01,0.06738560199737549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,1,32,balanced,0.08423466483751933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,power_law_1.2,0.08716800212860107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,power_law_1.01,0.09608319997787476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,power_law_1.01,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,balanced,0.1702773372332255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,1,32,balanced,0.08513599634170532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,power_law_1.2,0.10090880393981934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,power_law_1.01,0.08819199800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,power_law_1.01,0.06757760047912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,1,32,balanced,0.0858026643594106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,power_law_1.2,0.10572160482406616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,power_law_1.01,0.11383039951324463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,balanced,0.24310932556788126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,power_law_1.01,0.06757760047912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,1,32,balanced,0.08601066470146179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,power_law_1.01,0.1300927996635437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,power_law_1.2,0.11495039463043213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,power_law_1.01,0.07031679749488831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,1,32,balanced,0.08719999591509502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,balanced,0.3091306686401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,16,power_law_1.2,0.05000320076942444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,power_law_1.01,0.16869759559631348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,power_law_1.2,0.16641279458999633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,power_law_1.01,0.06913920044898987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,power_law_1.01,0.2095423936843872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,power_law_1.2,0.18457599878311157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,16,power_law_1.2,0.04937599897384644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,power_law_1.01,0.06990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,1,32,balanced,0.08842133482297261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,power_law_1.01,0.29732480049133303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,power_law_1.2,0.25162880420684813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,16,power_law_1.2,0.046751999855041505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,power_law_1.01,0.07153919935226441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,1,32,balanced,0.09092266360918681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,balanced,0.45209066073099774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,power_law_1.01,0.43393921852111816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,power_law_1.2,0.3079807996749878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,power_law_1.01,0.07527040243148804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,16,power_law_1.2,0.04794879853725433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,1,32,balanced,0.0944053332010905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,power_law_1.01,0.5100736141204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,power_law_1.2,0.45367679595947263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,16,power_law_1.2,0.05256959795951843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,power_law_1.01,0.0960319995880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,1,32,balanced,0.10428266723950703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,power_law_1.01,0.6572288036346435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,power_law_1.2,0.5711552143096924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,16,power_law_1.2,0.058796799182891844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,power_law_1.01,0.12610559463500975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,1,32,balanced,0.11316266655921936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,power_law_1.01,1.0156224250793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,balanced,0.5914239883422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,power_law_1.2,0.8557056427001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,16,power_law_1.2,0.06270719766616821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,power_law_1.01,0.1620736002922058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,power_law_1.01,1.584275245666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,power_law_1.2,1.142912006378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,16,power_law_1.2,0.060262399911880496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,power_law_1.01,0.186188805103302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,1,32,balanced,0.14889066418011984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,power_law_1.01,2.032601547241211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,16,power_law_1.2,0.06800000071525573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,power_law_1.2,1.6980863571166993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,power_law_1.01,0.3306495904922485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,1,32,balanced,0.17056532700856528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,16,power_law_1.2,0.07117440104484558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,power_law_1.01,2.669747161865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,power_law_1.2,2.2613311767578126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,power_law_1.01,0.39114880561828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,balanced,0.7342560291290283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,16,power_law_1.2,0.0707647979259491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,power_law_1.01,4.303916931152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,power_law_1.01,0.5338431835174561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,power_law_1.2,2.7379135131835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,16,power_law_1.2,0.0670527994632721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,1,32,balanced,0.2645813425381978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,power_law_1.01,0.6941440105438232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,power_law_1.2,4.444678497314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,16,power_law_1.2,0.06862080097198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,power_law_1.01,8.63636474609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,power_law_1.01,1.1939583778381349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,16,power_law_1.2,0.06898559927940369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,1,32,balanced,0.31544532378514606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,power_law_1.2,8.837094116210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,power_law_1.01,1.3684160232543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,16,power_law_1.2,0.07325440049171447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,16,power_law_1.2,0.0800383985042572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,power_law_1.01,2.1309247970581056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,16,power_law_1.2,0.08430079817771911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,balanced,1.156725327173869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,1,32,balanced,0.4629280169804891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,power_law_1.01,3.071379280090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,16,power_law_1.2,0.11204479932785034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,power_law_1.01,5.660793685913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,16,power_law_1.2,0.13626240491867064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,balanced,0.03316266586383184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,16,power_law_1.2,0.19540480375289918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,1,32,balanced,0.604698657989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,16,power_law_1.2,0.27701120376586913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,balanced,0.0349440003434817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,16,power_law_1.2,0.4096640110015869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,16,power_law_1.2,0.5180352210998536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,16,power_law_1.2,0.8384320259094238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,balanced,0.04276266694068909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,1,32,balanced,0.7514293193817139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,16,power_law_1.2,0.9711168289184571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,16,power_law_1.2,1.5155584335327148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,balanced,0.045269335309664406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,power_law_1.01,0.03444480001926422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,16,power_law_1.2,2.1296384811401365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,balanced,2.282602628072103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,power_law_1.01,0.03526400029659271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,16,power_law_1.2,2.4169023513793944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,power_law_1.01,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,balanced,0.047466665506362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,power_law_1.01,0.03984639942646027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,16,power_law_1.2,4.27088623046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,power_law_1.01,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,1,32,balanced,1.184821367263794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,16,power_law_1.2,8.644992065429687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,power_law_1.01,0.04503679871559143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,power_law_1.01,0.046982398629188536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,power_law_1.01,0.050348800420761106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,balanced,0.05958933134873708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,power_law_1.01,0.05957760214805603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,balanced,0.06038400034109751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,power_law_1.01,0.06020479798316956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,balanced,0.05625066657861074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,power_law_1.01,0.056032001972198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,balanced,0.05540800094604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,power_law_1.01,0.058303999900817874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,balanced,0.06025066475073496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,balanced,0.05969599882761637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,power_law_1.01,0.06321920156478882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,1,32,balanced,2.34171199798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,balanced,0.06025066475073496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,power_law_1.01,0.06094719767570496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,balanced,0.061253334085146584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,power_law_1.01,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,balanced,0.06257600088914235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,power_law_1.01,0.07086719870567322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,balanced,0.06589866677920024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,power_law_1.01,0.07579519748687744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,balanced,0.06911999980608623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,power_law_1.01,0.09660159945487976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,balanced,0.09191999832789104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,power_law_1.01,0.1009600043296814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,power_law_1.01,0.1302016019821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,balanced,0.09963200489679973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,power_law_1.01,0.1640768051147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,balanced,0.1485919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,power_law_1.01,0.2183743953704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,power_law_1.01,0.2976320028305054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,balanced,0.17390400171279907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,power_law_1.01,0.40456318855285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,power_law_1.01,0.5427968025207519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,balanced,0.24938666820526123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,power_law_1.01,0.810694408416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,power_law_1.01,0.9521599769592285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,balanced,0.311082661151886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,power_law_1.01,1.493286418914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,power_law_1.01,2.1642112731933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,balanced,0.4532639980316162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,power_law_1.01,4.214668655395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,balanced,0.5911786556243896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,balanced,0.02900800108909607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,balanced,0.7354506651560465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,8,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,balanced,0.032698666055997215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,8,power_law_1.2,0.0348800003528595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,balanced,0.03330666571855545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,8,power_law_1.2,0.034668800234794614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,balanced,0.036618667344252266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,8,power_law_1.2,0.03919999897480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,8,power_law_1.2,0.0420415997505188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,power_law_1.01,0.029683199524879456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,balanced,0.03740799923737844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,8,power_law_1.2,0.04527359902858734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,power_law_1.01,0.032179200649261476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,balanced,0.03753600021203359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,8,power_law_1.2,0.047737601399421695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,balanced,1.1563786665598552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,power_law_1.01,0.03240320086479187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,8,power_law_1.2,0.049465599656105044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,power_law_1.01,0.035673600435256955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,8,power_law_1.2,0.06017919778823853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,power_law_1.01,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,balanced,0.040778666734695435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,8,power_law_1.2,0.06247040033340454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,power_law_1.01,0.03761920034885406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,8,power_law_1.2,0.057126402854919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,power_law_1.01,0.04069119989871979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,balanced,0.04008000095685323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,8,power_law_1.2,0.057196801900863646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,power_law_1.01,0.04140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,8,power_law_1.2,0.06416640281677247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,4,power_law_1.2,0.029734399914741517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,8,power_law_1.2,0.06207360029220581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,4,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,balanced,0.04363200068473816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,power_law_1.01,0.04506880044937134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,8,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,4,power_law_1.2,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,8,power_law_1.2,0.06846719980239868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,4,power_law_1.2,0.035667198896408084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,8,power_law_1.2,0.0787392020225525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,balanced,0.0447626660267512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,power_law_1.01,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,4,power_law_1.2,0.03700479865074158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,8,power_law_1.2,0.09125120043754578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,power_law_1.01,0.04545280039310455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,balanced,0.04357333481311798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,4,power_law_1.2,0.039059200882911684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,8,power_law_1.2,0.10659840106964111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,4,power_law_1.2,0.04113920032978058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,8,power_law_1.2,0.1542464017868042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,balanced,0.027802666028340656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,balanced,2.2752960522969565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,8,power_law_1.2,0.1762943983078003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,4,power_law_1.2,0.04174720048904419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,balanced,0.030906667311986286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,power_law_1.01,0.06268159747123718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,balanced,0.059434667229652405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,8,power_law_1.2,0.2522495985031128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,4,power_law_1.2,0.0447488009929657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,balanced,0.03734933336575826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,8,power_law_1.2,0.4055935859680176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,4,power_law_1.2,0.04594559967517853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,balanced,0.03851733356714249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,4,power_law_1.2,0.045491200685501096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,8,power_law_1.2,0.5622975826263428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,power_law_1.01,0.0648576021194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,4,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,8,power_law_1.2,0.7595583915710449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,balanced,0.062368000547091164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,balanced,0.03688533355792364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,power_law_1.01,0.06035839915275574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,4,power_law_1.2,0.06409599781036376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,8,power_law_1.2,1.0642751693725585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,balanced,0.05675200124581655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,power_law_1.01,0.061286401748657224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,balanced,0.03798400113979975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,4,power_law_1.2,0.060012799501419065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,power_law_1.01,0.06779519915580749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,8,power_law_1.2,1.2762816429138184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,balanced,0.057717333237330117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,balanced,0.03803733239571253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,power_law_1.01,0.07567359805107117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,4,power_law_1.2,0.06282240152359009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,balanced,0.06402133405208588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,8,power_law_1.2,1.8584064483642577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,power_law_1.01,0.08402559757232667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,power_law_1.01,0.09096320271492005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,balanced,0.06532800197601318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,4,power_law_1.2,0.06760960221290588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,8,power_law_1.2,3.0336000442504885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,balanced,0.040693332751592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,power_law_1.01,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,balanced,0.0697813332080841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,4,power_law_1.2,0.0753920018672943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,balanced,0.03957866628964742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,power_law_1.01,0.15045759677886963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,8,power_law_1.2,5.199020767211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,balanced,0.07394666473070781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,balanced,0.04030400017897288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,power_law_1.01,0.027846398949623107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,power_law_1.01,0.1811840057373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,4,power_law_1.2,0.0864192008972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,power_law_1.01,0.2807744026184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,balanced,0.0941493312517802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,power_law_1.01,0.0302592009305954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,4,power_law_1.2,0.10379519462585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,power_law_1.01,0.37760000228881835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,power_law_1.01,0.030649599432945252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,balanced,0.10292800267537434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,balanced,0.047877331574757896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,power_law_1.01,0.4490943908691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,4,power_law_1.2,0.13244800567626952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,power_law_1.01,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,balanced,0.04711466530958811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,balanced,0.15370133519172668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,power_law_1.01,0.6593791961669921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,power_law_1.01,0.03708159923553467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,4,power_law_1.2,0.14843519926071166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,balanced,0.0470719983180364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,power_law_1.01,0.9600064277648925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,power_law_1.01,0.036582401394844054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,balanced,0.18619734048843384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,4,power_law_1.2,0.20622720718383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,power_law_1.01,1.1919551849365235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,power_law_1.01,0.03976959884166718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,4,power_law_1.2,0.3042880058288574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,power_law_1.01,1.8844480514526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,power_law_1.01,0.04089600145816803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,balanced,0.2673226594924927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,4,power_law_1.2,0.4246335983276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,power_law_1.01,0.0412992000579834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,balanced,0.06815466781457265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,power_law_1.01,3.732921600341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,power_law_1.01,0.045516800880432126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,power_law_1.2,0.5823872089385986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,balanced,0.06355200211207072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,4,balanced,0.33079999685287476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,power_law_1.01,0.04668160080909729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,balanced,0.0676746666431427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,power_law_1.2,0.741977596282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,power_law_1.01,0.05175039768218994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,balanced,0.07879466811815898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,power_law_1.2,1.1675071716308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,power_law_1.01,0.05495039820671081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,balanced,0.08261866867542267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,4,balanced,0.4883626699447632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,power_law_1.01,0.05632640123367309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,balanced,0.10889599720637004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,power_law_1.2,1.3742207527160644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,power_law_1.01,0.07727360129356384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,power_law_1.2,1.8413824081420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,balanced,0.11891733606656392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,power_law_1.01,0.08368639945983887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,balanced,0.18184532721837363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,power_law_1.2,3.923667144775391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,power_law_1.01,0.08634240031242371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,4,balanced,0.6327626705169678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,power_law_1.01,0.09171839952468872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,balanced,0.22428266207377115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,power_law_1.01,0.10533119440078735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,balanced,0.32578132549921673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,power_law_1.01,0.14186240434646608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,2,power_law_1.2,0.027859199047088622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,power_law_1.01,0.1651263952255249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,4,balanced,0.7845226923624674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,2,power_law_1.2,0.030803200602531434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,power_law_1.01,0.22023680210113525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,balanced,0.42524266242980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,2,power_law_1.2,0.031379199028015135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,power_law_1.01,0.2732287883758545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,2,power_law_1.2,0.0353983998298645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,power_law_1.01,0.42580480575561525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,2,power_law_1.2,0.037529599666595456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,power_law_1.01,0.5163455963134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,2,power_law_1.2,0.03735679984092712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,balanced,0.6204959948857626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,power_law_1.01,0.8171327590942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,2,power_law_1.2,0.04081920087337494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,power_law_1.01,1.0209088325500488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,4,balanced,1.2326026757558186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,2,power_law_1.2,0.04113920032978058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,power_law_1.01,1.3143744468688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,2,power_law_1.2,0.044819200038909913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,power_law_1.01,1.898137664794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,balanced,0.8147733211517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,2,power_law_1.2,0.04657920002937317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,power_law_1.01,3.5654529571533202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,2,power_law_1.2,0.04690560102462769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,2,power_law_1.2,0.05134080052375793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,2,power_law_1.2,0.05511040091514587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,2,power_law_1.2,0.057734400033950806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,balanced,1.0089279810587566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,2,power_law_1.2,0.07928959727287292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,2,power_law_1.2,0.0833791971206665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,2,power_law_1.2,0.09074559807777405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,2,power_law_1.2,0.09524480104446412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,2,power_law_1.2,0.11331839561462402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,2,power_law_1.2,0.14856319427490233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,4,balanced,2.4158612887064614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,2,power_law_1.2,0.17461119890213012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,balanced,1.5818773905436199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,2,power_law_1.2,0.22622718811035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,2,power_law_1.2,0.2895616054534912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,2,power_law_1.2,0.43367681503295896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,2,power_law_1.2,0.5174848079681397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,2,power_law_1.2,0.848691177368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,balanced,0.024325333535671234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,2,power_law_1.2,1.0213888168334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,balanced,0.02606400102376938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,2,power_law_1.2,1.3376959800720214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,balanced,0.028538666665554047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,2,power_law_1.2,2.1154624938964846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,balanced,0.03570666660865148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,power_law_1.2,4.426969528198242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,balanced,0.035061334570248924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,balanced,0.03568000098069509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,balanced,0.03581333408753077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,2,balanced,3.109504063924154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,balanced,0.03428266694148382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,balanced,0.03674133370320002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,balanced,0.03522133330504099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,balanced,0.035189333061377205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,balanced,0.03967999915281931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,power_law_1.01,0.02385919988155365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,power_law_1.01,0.02499839961528778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,balanced,0.0391839991013209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,power_law_1.01,0.026732799410820008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,balanced,0.04009066770474116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,power_law_1.01,0.029420799016952513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,power_law_1.01,0.03498879969120026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,balanced,0.05021866659323374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,power_law_1.01,0.03492479920387268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,1,power_law_1.2,0.023712000250816344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,balanced,0.04948799808820089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,power_law_1.01,0.03568640053272247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,balanced,0.047135998805363975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,1,power_law_1.2,0.02497279942035675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,power_law_1.01,0.03692800104618073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,balanced,0.04523199796676636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,1,power_law_1.2,0.025843200087547303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,balanced,0.04755199948946635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,1,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,power_law_1.01,0.036620798707008365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,balanced,0.049695998430252075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,1,power_law_1.2,0.0345984011888504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,balanced,0.0476746658484141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,power_law_1.01,0.03944959938526153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,balanced,0.05415999889373779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,1,power_law_1.2,0.03519999980926514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,balanced,0.04788800080617269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,power_law_1.01,0.04264320135116577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,1,power_law_1.2,0.03597440123558045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,balanced,0.04779199759165446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,1,power_law_1.2,0.03685120046138764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,power_law_1.01,0.04713599979877472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,balanced,0.04878933231035868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,1,power_law_1.2,0.03918080031871796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,power_law_1.01,0.047366398572921756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,balanced,0.048325334986050926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,1,power_law_1.2,0.03963519930839539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,balanced,0.07785599927107494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,1,power_law_1.2,0.04323199987411499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,power_law_1.01,0.04992640018463135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,balanced,0.04725866516431173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,1,power_law_1.2,0.04624640047550201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,balanced,0.0845973292986552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,balanced,0.0460746685663859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,power_law_1.01,0.05566080212593079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,1,power_law_1.2,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,balanced,0.04612799982229868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,power_law_1.01,0.060761600732803345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,balanced,0.12559466560681662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,1,power_law_1.2,0.05014399886131286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,balanced,0.0462666650613149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,1,power_law_1.2,0.05569919943809509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,balanced,0.036357333262761436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,power_law_1.01,0.06533759832382202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,balanced,0.13889066378275552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,balanced,0.052229334910710655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,1,power_law_1.2,0.0602944016456604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,balanced,0.03846399982770284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,power_law_1.01,0.10154240131378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,balanced,0.05550933380921682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,1,power_law_1.2,0.06638079881668091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,balanced,0.0366239994764328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,balanced,0.21342400709788004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,power_law_1.01,0.11503360271453858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,balanced,0.056101332108179726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,1,power_law_1.2,0.103603196144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,balanced,0.037685332198937736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,power_law_1.01,0.15259519815444947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,balanced,0.05682666599750519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,1,power_law_1.2,0.11574399471282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,balanced,0.03730666637420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,balanced,0.2651253342628479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,power_law_1.01,0.1764672040939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,balanced,0.063701331615448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,1,power_law_1.2,0.1529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,balanced,0.03828799972931544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,power_law_1.01,0.22853119373321534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,balanced,0.06089066465695699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,balanced,0.03860799968242645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,1,power_law_1.2,0.17845760583877562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,balanced,0.38860265413920086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,power_law_1.01,0.30329599380493166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,balanced,0.03830400109291077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,1,power_law_1.2,0.23032960891723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,balanced,0.0836853285630544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,power_law_1.01,0.42435197830200194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,balanced,0.03878399978081385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,1,power_law_1.2,0.3044287919998169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,power_law_1.01,0.5439807891845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,balanced,0.0395413339138031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,balanced,0.5091040134429932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,balanced,0.08044800162315369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,1,power_law_1.2,0.425548791885376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,power_law_1.01,0.7797567844390869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,balanced,0.03755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,balanced,0.11083199580510457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,1,power_law_1.2,0.5495935916900635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,power_law_1.01,1.0084799766540526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,balanced,0.03791466603676478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,power_law_1.01,1.235756778717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,balanced,0.03798400113979975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,power_law_1.2,0.7808896064758301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,balanced,0.11483200391133626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,1,balanced,0.7505386670430502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,power_law_1.01,1.9295360565185546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,balanced,0.03990933299064636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,power_law_1.2,1.0147392272949218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,balanced,0.18464533487955728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,balanced,0.043280000487963356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,power_law_1.01,3.7951873779296874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,power_law_1.2,1.2387904167175292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,balanced,0.04515733321507772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,balanced,0.19760000705718994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,power_law_1.2,1.9408767700195313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,balanced,0.04624533156553904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,1,balanced,0.9842933019002279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,power_law_1.2,3.8045185089111326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,balanced,0.060559997955958046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,balanced,0.2807733416557312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,balanced,0.08055466910203297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,balanced,0.08517332871754964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,balanced,0.36166401704152423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,balanced,0.11405866344769795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,1,balanced,1.2198186715443928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,balanced,0.13099732995033264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.01,0.04322560131549835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,balanced,0.028186666468779247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,balanced,0.4484693209330241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,balanced,0.18787733713785806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.01,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,balanced,0.028175999720891316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,balanced,0.028218666712443035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.01,0.04103040099143982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,balanced,0.030266667405764263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,balanced,0.2212000091870626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.01,0.043673598766326906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,balanced,0.02993600070476532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.01,0.043833601474761966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,balanced,0.654698650042216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,balanced,0.030250666042168934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,balanced,0.0310506671667099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.01,0.04622080028057098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,balanced,0.31804800033569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,1,balanced,1.9171147346496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,balanced,0.030576000610987347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.01,0.04912000000476837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,balanced,0.03213333338499069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.01,0.05431680083274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,balanced,0.03288000077009201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.01,0.06439039707183838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.01,0.035488000512123107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,balanced,0.4115413427352905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.01,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.01,0.037555199861526486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.01,0.057683199644088745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.01,0.035359999537467955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.01,0.06112639904022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,balanced,0.5070453484853109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.01,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.01,0.03727999925613403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,balanced,0.030080000559488933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.01,0.06406400203704835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,balanced,1.3776747385660808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.01,0.03731200098991394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.01,0.08293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,balanced,0.03107733279466629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.01,0.07832959890365601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,balanced,0.03165333221356074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.01,0.03832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.01,0.09671679735183716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,balanced,0.030752000709374745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,balanced,0.755413293838501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.01,0.12617599964141846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.01,0.03989759981632233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.01,0.1332352042198181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.01,0.04500479996204376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.01,0.1829375982284546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.01,0.05125759840011597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.01,0.22070400714874266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.01,0.04560000002384186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,1,balanced,3.7880427042643228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.01,0.3335808038711548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.01,0.04723840057849884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,balanced,0.038506666819254555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.01,0.31359360218048093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.01,0.05406079888343811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,balanced,0.039461334546407066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.01,0.4102719783782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.01,0.047916799783706665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,balanced,0.03944533318281174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.01,0.059084802865982056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.01,0.5608640193939209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,balanced,1.4612213770548503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.01,0.06631039977073669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.01,0.8734784126281738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.01,0.07038080096244811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.01,1.1611455917358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.01,0.08552320003509521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.01,1.3440832138061523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.01,0.09827200174331666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.01,2.2683712005615235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.01,0.13604480028152466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,balanced,0.04819199939568838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.01,4.6218303680419925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.01,0.15679359436035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,balanced,0.05403733253479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.01,0.2030719995498657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.01,0.26445438861846926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.01,0.3602303981781006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.01,0.4604288101196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.01,0.6843135833740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,balanced,0.06553066770235698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.01,0.9741312026977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.01,1.177849578857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.01,1.882156753540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.01,3.0412736892700196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,balanced,0.07344533503055573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,balanced,0.10077333450317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,power_law_1.01,0.027577599883079527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,power_law_1.01,0.02778880000114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,balanced,0.12106133500734965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,power_law_1.01,0.02961280047893524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,balanced,0.16638933618863425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,8,8,power_law_1.2,0.04519039988517761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,power_law_1.01,0.029721599817276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,8,8,power_law_1.2,0.04625279903411865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,power_law_1.01,0.03221119940280914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,balanced,0.21481066942214966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,8,8,power_law_1.2,0.04347519874572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,power_law_1.01,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,8,8,power_law_1.2,0.04645119905471802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,power_law_1.01,0.03459199965000152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,balanced,0.32396266857783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,8,8,power_law_1.2,0.04595839977264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,power_law_1.01,0.03784320056438446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,8,8,power_law_1.2,0.04647040069103241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,power_law_1.01,0.0398144006729126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,8,8,power_law_1.2,0.04959999918937683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,balanced,0.42369067668914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,8,8,power_law_1.2,0.052799999713897705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,8,8,power_law_1.2,0.06156799793243408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,power_law_1.01,0.04046080112457275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,8,8,power_law_1.2,0.061337602138519284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,power_law_1.01,0.04574080109596253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,balanced,0.5335946480433146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,8,8,power_law_1.2,0.05753600001335144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,power_law_1.01,0.05018240213394165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,8,8,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,power_law_1.01,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,8,8,power_law_1.2,0.07348480224609374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,8,8,power_law_1.2,0.06232960224151611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,balanced,0.8376800219217936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,8,8,power_law_1.2,0.0770367980003357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,power_law_1.01,0.06423680186271667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,8,8,power_law_1.2,0.08629119992256165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,power_law_1.01,0.06771199703216553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,8,8,power_law_1.2,0.0973695993423462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,power_law_1.01,0.08020480275154114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,8,8,power_law_1.2,0.12851200103759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,8,8,power_law_1.2,0.13507200479507447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,power_law_1.01,0.097324800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,8,8,power_law_1.2,0.18053120374679565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,power_law_1.01,0.11575039625167846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,8,8,power_law_1.2,0.2159872055053711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,balanced,1.6312534014383953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,8,8,power_law_1.2,0.313427209854126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,8,8,power_law_1.2,0.31407999992370605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,8,8,power_law_1.2,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,power_law_1.01,0.14908159971237184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,8,8,power_law_1.2,0.48300800323486326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,8,8,power_law_1.2,0.037651199102401736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,8,8,power_law_1.2,0.5734335899353027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,8,8,power_law_1.2,0.03653759956359863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,8,8,power_law_1.2,0.8629376411437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,power_law_1.01,0.1851904034614563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,8,8,power_law_1.2,0.038124799728393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,8,8,power_law_1.2,1.2036928176879882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,8,8,power_law_1.2,0.027641600370407103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,power_law_1.01,0.3118016004562378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,8,8,power_law_1.2,0.03749119937419891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,8,8,power_law_1.2,1.5659071922302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,balanced,0.035162667433420815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,8,8,power_law_1.2,0.027807998657226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,8,8,power_law_1.2,0.03826560080051422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,balanced,0.03510399907827377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,8,8,power_law_1.2,2.1197248458862306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,8,8,power_law_1.2,0.02794879972934723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,power_law_1.01,0.35495040416717527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,8,8,power_law_1.2,0.039084801077842714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,balanced,0.04609066744645437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,8,8,power_law_1.2,0.029683199524879456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,power_law_1.01,0.4787583827972412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,8,8,power_law_1.2,4.6851646423339846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,balanced,0.046810666720072426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,8,8,power_law_1.2,0.04032639861106872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,8,8,power_law_1.2,0.029868799448013305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,power_law_1.01,0.7535103797912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,balanced,0.04731733103593191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,8,8,power_law_1.2,0.03201279938220978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,8,8,power_law_1.2,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,power_law_1.01,1.0734975814819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,8,8,power_law_1.2,0.03203839957714081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,balanced,0.047210668524106346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,8,8,power_law_1.2,0.04739840030670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,8,8,power_law_1.2,0.03372159898281098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,balanced,0.047024001677831016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,power_law_1.01,1.435155200958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,8,8,power_law_1.2,0.04387840032577515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,balanced,0.04804266492525736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,8,8,power_law_1.2,0.03761920034885406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,power_law_1.01,1.5005632400512696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,8,8,power_law_1.2,0.05135999917984009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,balanced,0.04710933566093445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,8,8,power_law_1.2,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,balanced,0.032746667663256325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,power_law_1.01,2.854412841796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,balanced,0.046869332591692604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,8,8,power_law_1.2,0.054092800617218016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,balanced,0.03258133431275686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,balanced,0.04680533210436503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,8,8,power_law_1.2,0.05084800124168396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,power_law_1.01,5.653235244750976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,balanced,0.04677333434422811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,8,8,power_law_1.2,0.03988479971885681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,balanced,0.034330666065216064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,balanced,0.04691733419895172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,8,8,power_law_1.2,0.06136959791183472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,8,8,power_law_1.2,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,balanced,0.05217066903909048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,balanced,0.035717333356539406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,8,8,power_law_1.2,0.060172802209854125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,8,8,power_law_1.2,0.05041279792785645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,balanced,0.05705066521962484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,balanced,0.03481066723664602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,balanced,0.05829866727193197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,8,8,power_law_1.2,0.0691968023777008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,8,8,power_law_1.2,0.051635199785232545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,balanced,0.056608001391092934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,balanced,0.03579733272393545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,8,8,power_law_1.2,0.08734719753265381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,balanced,0.06786133348941803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,balanced,0.036303999523321785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,8,8,power_law_1.2,0.10487680435180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,8,8,power_law_1.2,0.06439039707183838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,balanced,0.06710933148860931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,balanced,0.03612266729275385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,8,8,power_law_1.2,0.14295680522918702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,balanced,0.08400533596674602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,8,8,power_law_1.2,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,balanced,0.03735466549793879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,balanced,0.08453333377838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,8,8,power_law_1.2,0.15955840349197387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,8,8,power_law_1.2,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,8,8,power_law_1.2,0.2256704092025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,balanced,0.12177067001660664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,balanced,0.03752533346414566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,8,8,power_law_1.2,0.2713536024093628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,balanced,0.1275200049082438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,8,8,power_law_1.2,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,balanced,0.0391839991013209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,8,8,power_law_1.2,0.3953727960586548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,8,8,power_law_1.2,0.11278719902038574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,balanced,0.20146133502324423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,balanced,0.039818666875362396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,8,8,power_law_1.2,0.47901439666748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,balanced,0.03998400022586187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,8,8,power_law_1.2,0.7170815944671631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,balanced,0.22962667544682822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,balanced,0.02638400097688039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,8,8,power_law_1.2,0.13864320516586304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,balanced,0.051685333251953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,8,8,power_law_1.2,0.9744959831237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,balanced,0.02622399975856145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,balanced,0.051967998345692955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,8,8,power_law_1.2,1.138963222503662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,balanced,0.32942400376001996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,balanced,0.027493332823117573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,balanced,0.04896000027656555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,8,8,power_law_1.2,0.17305599451065062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,8,8,power_law_1.2,1.7748800277709962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,8,8,power_law_1.2,0.31738240718841554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,balanced,0.06163200239340464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,balanced,0.02961066613594691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,8,8,power_law_1.2,3.427155303955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,balanced,0.43268799781799316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,balanced,0.06543466448783875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,balanced,0.030266667405764263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,8,8,power_law_1.2,0.3839871883392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,balanced,0.03048533449570338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,balanced,0.08513066172599792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,8,8,power_law_1.2,0.5375232219696044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,balanced,0.5440959930419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,8,8,power_law_1.2,0.7141632080078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,balanced,0.030026666820049286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,balanced,0.09087466200192769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,8,8,power_law_1.2,1.1242112159729003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,balanced,0.03142400085926056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,8,8,power_law_1.2,1.4600383758544921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,balanced,0.12625599900881448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,balanced,0.03214933226505915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,8,8,power_law_1.2,1.6736383438110352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,8,8,power_law_1.2,2.7153663635253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,balanced,0.14387200276056925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,balanced,0.7910719712575277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,8,8,power_law_1.2,5.567903900146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,balanced,0.2086720069249471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,balanced,0.030415999392668407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,balanced,0.253440002600352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,balanced,0.031370667119820915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,balanced,0.0322026660044988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,balanced,0.3662453492482503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,balanced,0.03156266609827677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,balanced,1.4914132754007976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,balanced,0.47437866528828937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,balanced,0.04044266790151596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,balanced,0.5869280099868774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,balanced,0.041264000038305916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,balanced,0.04242133100827535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,balanced,0.8936320145924886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,balanced,0.05487466851870219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,balanced,0.061109334230422974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.01,0.04346239864826203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.01,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.01,0.04325119853019714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.01,0.04618239998817444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.01,0.04622719883918762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.01,0.04616959989070892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,balanced,0.07749866445859273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.01,0.046419200301170346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,balanced,1.7032960255940754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.01,0.04854399859905243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.01,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.01,0.051046401262283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.01,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.01,0.036371201276779175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.01,0.05127040147781372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,balanced,0.08707200487454732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.01,0.034796801209449765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.01,0.056704002618789676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.01,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,balanced,0.12169067064921062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.01,0.06280320286750793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.01,0.037376001477241516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,balanced,0.1514079968134562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.01,0.037939199805259706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.01,0.06654719710350036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.01,0.037964800000190736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,balanced,0.2311733365058899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.01,0.06839039921760559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.01,0.040633600950241086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.01,0.08665599822998046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,balanced,0.30766934156417847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.01,0.10181119441986083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.01,0.04073599874973297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,power_law_1.01,0.027225598692893982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.01,0.04352000057697296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.01,0.11471999883651733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,power_law_1.01,0.02656640112400055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,balanced,0.4484479824701945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.01,0.14706560373306274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,power_law_1.01,0.027039998769760133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.01,0.15318399667739868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.01,0.047014400362968445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,power_law_1.01,0.029235199093818665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.01,0.05235199928283692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.01,0.2361920118331909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,balanced,0.5955573320388794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.01,0.2719871997833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.01,0.050483202934265135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,power_law_1.01,0.029811200499534608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.01,0.3757695913314819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.01,0.06432639956474304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,power_law_1.01,0.031590399146080014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.01,0.587769603729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.01,0.07020800113677979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,balanced,0.7484052975972494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,power_law_1.01,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.01,0.7195583820343018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.01,0.06751999855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,power_law_1.01,0.03475199937820435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.01,1.1120448112487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.01,0.08266879916191101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.01,1.605062484741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.01,0.09355520009994507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,balanced,1.1825599670410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.01,2.389299201965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.01,0.12394239902496337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,power_law_1.01,0.04078719913959503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.01,0.14754559993743896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.01,3.4003841400146486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.01,0.19239039421081544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,power_law_1.01,0.04437119960784912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.01,0.24040958881378174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,power_law_1.01,0.045977601408958436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.01,0.34022400379180906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,power_law_1.01,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.01,0.4151616096496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.01,0.6994880199432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,power_law_1.01,0.05694720149040222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,balanced,2.3318986892700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.01,0.9455360412597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,4,power_law_1.2,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,4,power_law_1.2,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,power_law_1.01,0.06499840021133423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.01,1.2145855903625489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,4,power_law_1.2,0.03557760119438171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,4,power_law_1.2,0.04353919923305512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,power_law_1.01,0.07824000120162963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,4,power_law_1.2,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.01,1.6699712753295899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,4,power_law_1.2,0.043033599853515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,4,power_law_1.2,0.037299200892448425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,4,power_law_1.2,0.045824000239372255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.01,2.82857608795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,4,power_law_1.2,0.03702400028705597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,power_law_1.01,0.09182080030441284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,4,power_law_1.2,0.046515199542045596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,4,power_law_1.2,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,4,power_law_1.2,0.047040000557899475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,power_law_1.01,0.10927360057830811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,4,power_law_1.2,0.0377023994922638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,4,power_law_1.2,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,4,power_law_1.2,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,4,power_law_1.2,0.04991999864578247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,4,power_law_1.2,0.05043839812278748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,4,power_law_1.2,0.04159359931945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,4,power_law_1.2,0.052083200216293334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,4,power_law_1.2,0.04249599874019623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,power_law_1.01,0.145414400100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,4,power_law_1.2,0.05355520248413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,4,power_law_1.2,0.05783039927482605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,4,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,4,power_law_1.2,0.026598399877548216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,4,power_law_1.2,0.06251519918441772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,4,power_law_1.2,0.04578559994697571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,4,power_law_1.2,0.06209920048713684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,power_law_1.01,0.18265600204467775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,4,power_law_1.2,0.02690559923648834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,4,power_law_1.2,0.05006719827651977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,4,power_law_1.2,0.06513919830322265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,4,power_law_1.2,0.05614719986915588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,4,power_law_1.2,0.02778880000114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,power_law_1.01,0.2966079950332642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,4,power_law_1.2,0.06753919720649719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,4,power_law_1.2,0.06233599781990051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,4,power_law_1.2,0.029203200340270997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,4,power_law_1.2,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,power_law_1.01,0.43388800621032714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,4,power_law_1.2,0.0695680022239685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,4,power_law_1.2,0.02933120131492615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,4,power_law_1.2,0.07160959839820862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,4,power_law_1.2,0.09954559803009033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,4,power_law_1.2,0.03076480031013489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,power_law_1.01,0.5479872226715088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,4,power_law_1.2,0.08721920251846313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,4,power_law_1.2,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,4,power_law_1.2,0.11906559467315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,power_law_1.01,0.7859903812408447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,4,power_law_1.2,0.11185920238494873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,4,power_law_1.2,0.035692799091339114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,4,power_law_1.2,0.1628864049911499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,4,power_law_1.2,0.15689599514007568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,4,power_law_1.2,0.18542720079421998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,power_law_1.01,0.975596809387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,4,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,4,power_law_1.2,0.24532480239868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,4,power_law_1.2,0.1443711996078491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,4,power_law_1.2,0.038124799728393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,power_law_1.01,1.4300928115844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,4,power_law_1.2,0.3344640016555786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,4,power_law_1.2,0.1894719958305359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,power_law_1.01,1.6220544815063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,4,power_law_1.2,0.4295487880706787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,4,power_law_1.2,0.22021119594573973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,4,power_law_1.2,0.040064001083374025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,4,power_law_1.2,0.4936704158782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,power_law_1.01,2.576147270202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,4,power_law_1.2,0.4291776180267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,4,power_law_1.2,0.04446719884872437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,4,power_law_1.2,0.4322495937347412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,4,power_law_1.2,0.9145471572875976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,4,power_law_1.2,0.050367999076843264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,power_law_1.01,6.141382217407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,4,power_law_1.2,0.6346432209014893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,4,power_law_1.2,1.0419072151184081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,4,power_law_1.2,0.0500544011592865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,4,power_law_1.2,0.9959487915039062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,4,power_law_1.2,1.5606911659240723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,4,power_law_1.2,1.1537792205810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,4,power_law_1.2,2.0538751602172853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,4,power_law_1.2,0.05761920213699341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,4,power_law_1.2,1.912460708618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,4,power_law_1.2,4.3859905242919925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,4,power_law_1.2,0.06307200193405152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,balanced,0.02956799914439519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,4,power_law_1.2,3.561299133300781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,4,power_law_1.2,0.07456640005111695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,balanced,0.03019733230272929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,balanced,0.041536000867684685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,4,power_law_1.2,0.08793600201606751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,balanced,0.054586668809254967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,4,power_law_1.2,0.11481599807739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,balanced,0.048991998036702476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,balanced,0.04972266654173533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,4,power_law_1.2,0.17441279888153077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,balanced,0.04828799764315287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,balanced,0.04580266773700714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,4,power_law_1.2,0.1831168055534363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,balanced,0.047210668524106346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,balanced,0.04731733103593191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,4,power_law_1.2,0.26178560256958006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,4,power_law_1.2,0.3329983949661255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,balanced,0.047482664386431374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,4,power_law_1.2,0.6350592136383056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,balanced,0.048528000712394714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,balanced,0.04796266555786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,4,power_law_1.2,0.9415040016174316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,balanced,0.0488373339176178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,4,power_law_1.2,1.0805760383605958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,balanced,0.06359999875227611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,4,power_law_1.2,1.3518336296081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,balanced,0.06437866886456807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,4,power_law_1.2,2.1982143402099608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,balanced,0.060602664947509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,4,power_law_1.2,3.392185592651367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,balanced,0.07322666545708974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,4,power_law_1.2,7.020556640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,balanced,0.07035733262697856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,balanced,0.09642666578292847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,balanced,0.0322080006202062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,balanced,0.09589333335558574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,balanced,0.14010666807492575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,balanced,0.033887999753157295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,balanced,0.1747466723124186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,balanced,0.03577066709597906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,balanced,0.037178667883078255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,balanced,0.24919466177622476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,balanced,0.03689600030581156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,balanced,0.2958880066871643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,balanced,0.03786666691303253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,balanced,0.038160001238187156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,balanced,0.4255839983622233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.01,0.03250559866428375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,balanced,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,balanced,0.03976000100374222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.01,0.03430399894714355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,balanced,0.5915413300196329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,balanced,0.03842133283615112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,balanced,0.03869866579771042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.01,0.053478401899337766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,balanced,0.039306665460268654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.01,0.047302401065826415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,balanced,0.7354719638824463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,balanced,0.04049066702524821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.01,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,balanced,0.026261332134405773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,balanced,0.05230399966239929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.01,0.05299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.01,0.05077760219573975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,balanced,0.05230399966239929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,balanced,0.02658133457104365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.01,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,balanced,0.027802666028340656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,balanced,0.05217599868774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,balanced,1.031056006749471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.01,0.05189120173454285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,balanced,0.029978667696317036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,balanced,0.06803733110427856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,balanced,0.029813334345817566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.01,0.049932798743247984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,balanced,0.07069333394368489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,balanced,0.030533333619435627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.01,0.05375360250473023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,balanced,0.0925439993540446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,balanced,0.031701333820819855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.01,0.05541759729385376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,balanced,0.10286933183670044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,balanced,0.03075733284155528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.01,0.0621504008769989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.01,0.07384960055351257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,balanced,0.14477866888046265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.01,0.07493759989738465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,balanced,0.03342399994532267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,balanced,0.17546667655309042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.01,0.07425280213356018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,balanced,1.9613866806030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.01,0.08828799724578858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,balanced,0.25474133094151813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.01,0.09576320052146911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.01,0.03423359990119934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.01,0.13441920280456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,balanced,0.3232906659444173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.01,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.01,0.14236799478530884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.01,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,balanced,0.03287466615438461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.01,0.1919935941696167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.01,0.036499199271202085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,balanced,0.4715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,balanced,0.03358400116364161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.01,0.036934399604797365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.01,0.26776320934295655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.01,0.03763200044631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,balanced,0.035418666899204254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.01,0.3763008117675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.01,0.03971199989318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,balanced,0.03579200059175491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.01,0.039647999405860904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.01,0.41534080505371096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,balanced,0.5982293287913004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.01,0.04142720103263855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.01,0.5497344017028809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.01,0.042131200432777405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.01,0.041715198755264284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.01,0.941260814666748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,balanced,0.04590400060017904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.01,0.04287360012531281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,balanced,0.7352266311645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.01,1.257759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,2,power_law_1.2,0.03192319869995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,balanced,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.01,0.0447488009929657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.01,1.778451156616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.01,0.05240960121154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,balanced,0.052570665876070656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,2,power_law_1.2,0.03258239924907684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.01,0.0593280017375946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,power_law_1.01,0.026163199543952943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.01,2.8355520248413084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,2,power_law_1.2,0.03323520123958588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.01,0.06255360245704651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,2,power_law_1.2,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,power_law_1.01,0.026284798979759216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.01,0.06749439835548401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,balanced,1.1333599885304768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,2,power_law_1.2,0.047219198942184445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,balanced,0.07096533477306366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.01,0.08346880078315735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,power_law_1.01,0.026764801144599913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,2,power_law_1.2,0.05149440169334411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.01,0.0877888023853302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,balanced,0.0775786687930425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.01,0.12108800411224366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,2,power_law_1.2,0.05279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,power_law_1.01,0.0298880010843277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.01,0.13682559728622437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,2,power_law_1.2,0.05015040040016174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,power_law_1.01,0.033164799213409424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.01,0.18385920524597169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,2,power_law_1.2,0.05161600112915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,balanced,0.1030399998029073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.01,0.2325824022293091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,power_law_1.01,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,2,power_law_1.2,0.05107839703559876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.01,0.3186559915542603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,2,power_law_1.2,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,power_law_1.01,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,balanced,2.2914932568868003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.01,0.40668158531188964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,2,power_law_1.2,0.05001599788665771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.01,0.6199168205261231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,power_law_1.01,0.035955199599266054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,2,power_law_1.2,0.052902400493621826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,balanced,0.12384000420570374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.01,0.8198592185974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,power_law_1.01,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,2,power_law_1.2,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.01,1.0652480125427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,2,power_law_1.2,0.07170559763908387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,balanced,0.19690666596094766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,2,power_law_1.2,0.0781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.01,1.8004480361938477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,power_law_1.01,0.04354560077190399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,balanced,0.25305066506067914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,2,power_law_1.2,0.07678719758987426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.01,3.0913728713989257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,power_law_1.01,0.04520959854125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,2,power_law_1.2,0.09667840003967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,balanced,0.36318401495615643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,power_law_1.01,0.04560000002384186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,2,power_law_1.2,0.1058303952217102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,power_law_1.01,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,2,power_law_1.2,0.13076479434967042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,balanced,0.47575998306274414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,2,power_law_1.2,0.14256639480590821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,2,power_law_1.2,0.03378559947013855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,power_law_1.01,0.06102399826049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,2,power_law_1.2,0.20276479721069335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,balanced,0.7001492977142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,2,power_law_1.2,0.03390080034732819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,power_law_1.01,0.06391040086746216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,2,power_law_1.2,0.259008002281189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,2,power_law_1.2,0.03287039995193482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,power_law_1.01,0.07496320009231568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,2,power_law_1.2,0.3661887884140015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,2,power_law_1.2,0.036595198512077334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,2,power_law_1.2,0.4280576229095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,balanced,0.9168586730957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,2,power_law_1.2,0.036550399661064145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,power_law_1.01,0.09126399755477906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,2,power_law_1.2,0.603001594543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,2,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,2,power_law_1.2,1.0068608283996583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,power_law_1.01,0.09898880124092102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,2,power_law_1.2,1.2032320022583007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,2,power_law_1.2,0.039155200123786926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,balanced,1.147818644841512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,2,power_law_1.2,0.04021120071411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,2,power_law_1.2,1.6837055206298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,power_law_1.01,0.12091519832611083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,2,power_law_1.2,0.04071039855480194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,2,power_law_1.2,2.337414360046387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,2,power_law_1.2,0.04176000058650971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,2,power_law_1.2,0.04084480106830597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,power_law_1.01,0.19510400295257568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,2,power_law_1.2,0.04259200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,power_law_1.01,0.29857280254364016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,2,power_law_1.2,0.04653440117835998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,balanced,1.8204639752705891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,2,power_law_1.2,0.05367040038108826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,power_law_1.01,0.3427776098251343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,2,power_law_1.2,0.05961599946022034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,power_law_1.01,0.5559232234954834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,2,power_law_1.2,0.06454399824142457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,power_law_1.01,0.6801087856292725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,2,power_law_1.2,0.07043840289115906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,power_law_1.01,1.190719985961914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,2,power_law_1.2,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,power_law_1.01,1.448812770843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,2,power_law_1.2,0.09123839735984803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,power_law_1.01,1.5362431526184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,2,power_law_1.2,0.11827199459075928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,2,power_law_1.2,0.14302719831466676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,balanced,3.595973332722982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,power_law_1.01,3.028006362915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,2,power_law_1.2,0.19343359470367433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,2,power_law_1.2,0.21765758991241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,power_law_1.01,5.376678466796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,2,power_law_1.2,0.324288010597229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,2,power_law_1.2,0.46594557762145994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,2,power_law_1.2,0.6355967998504639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,2,power_law_1.2,0.02654080092906952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,2,power_law_1.2,0.9375552177429199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,2,power_law_1.2,0.026771199703216553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,2,power_law_1.2,1.1512063980102538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,2,power_law_1.2,1.4177920341491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,2,power_law_1.2,0.02710399925708771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,2,power_law_1.2,0.02943359911441803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,2,power_law_1.2,3.1278783798217775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,2,power_law_1.2,0.029414400458335876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,2,power_law_1.2,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,2,power_law_1.2,0.03214719891548157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,2,power_law_1.2,0.03312000036239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,2,power_law_1.2,0.03413119912147522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,balanced,0.06833600004514058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,2,power_law_1.2,0.035769599676132205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,balanced,0.060826669136683144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,balanced,0.057274664441744484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,2,power_law_1.2,0.0430400013923645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,balanced,0.05770133435726166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,balanced,0.05875733494758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,2,power_law_1.2,0.04431999921798706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,balanced,0.058186665177345276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,2,power_law_1.2,0.04519680142402649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,balanced,0.058975999553998314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,2,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,balanced,0.06145066519578298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,balanced,0.05957333246866862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,2,power_law_1.2,0.060627198219299315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,balanced,0.05921066800753275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,2,power_law_1.2,0.0639360010623932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,balanced,0.059088001648585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,2,power_law_1.2,0.07059839963912964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,balanced,0.06063466767470042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,2,power_law_1.2,0.09347839951515198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,balanced,0.06066133578618368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,2,power_law_1.2,0.10852479934692383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,balanced,0.06974933544794719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,balanced,0.041663999358812966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,balanced,0.07097599903742473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,2,power_law_1.2,0.14696320295333862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,balanced,0.043696001172065735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,balanced,0.0738613357146581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,balanced,0.04199466605981191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,balanced,0.08558400472005208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,balanced,0.04238399863243103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,balanced,0.04394666850566864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,2,power_law_1.2,0.21237759590148925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,balanced,0.0796853353579839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,balanced,0.043706665436426796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,2,power_law_1.2,0.3004928112030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,balanced,0.1136799951394399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,balanced,0.04573333263397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,balanced,0.04721599817276001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,2,power_law_1.2,0.38939518928527833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,balanced,0.11121599872907002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,balanced,0.04892266790072123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,2,power_law_1.2,0.5468095779418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,balanced,0.04596266647179922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,balanced,0.17495999733606973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,balanced,0.04903466502825419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,2,power_law_1.2,0.8440383911132813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,balanced,0.05028266708056132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,2,power_law_1.2,1.0144960403442382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,balanced,0.16897600889205933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,balanced,0.050997331738471985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,balanced,0.035242666800816856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,balanced,0.06001600126425425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,2,power_law_1.2,1.353548812866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,balanced,0.060218666990598045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,balanced,0.25428799788157147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,balanced,0.0645066648721695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,2,power_law_1.2,1.605753517150879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,balanced,0.03418133407831192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,balanced,0.07286933561166127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,balanced,0.28485333919525146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,2,power_law_1.2,2.510393524169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,balanced,0.036831999818483986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,balanced,0.07710400223731995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,balanced,0.10281599561373393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,balanced,0.03700266778469086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,2,power_law_1.2,6.182502365112304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,balanced,0.11202133695284526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,balanced,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,balanced,0.41941332817077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,balanced,0.1590720017751058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,balanced,0.0377813329299291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,balanced,0.17704532543818155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.01,0.06693120002746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,balanced,0.03815466662247976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,balanced,0.5290506680806478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,balanced,0.04214933514595032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,balanced,0.25878934065500897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.01,0.059308797121047974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.01,0.05592319965362549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,balanced,0.3060479958852132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,balanced,0.6734240055084229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.01,0.05727360248565674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,balanced,0.4474613269170125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.01,0.05726720094680786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.01,0.060134398937225345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,balanced,0.04126933217048645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.01,0.04133760035037994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.01,0.06472960114479065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,balanced,0.5686879952748617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,balanced,0.04142933338880539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.01,0.04391680061817169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,balanced,1.0321866671244304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.01,0.06240000128746033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,balanced,0.043807998299598694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.01,0.04132480025291443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.01,0.06379520297050476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,balanced,0.043706665436426796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.01,0.04221439957618713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.01,0.06787840127944947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,balanced,0.7095306714375814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.01,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.01,0.04353919923305512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.01,0.04643200039863586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.01,0.08457599878311158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.01,0.048902401328086854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.01,0.09052799940109253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.01,0.05067520141601563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.01,0.08281599879264831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,balanced,1.1064586639404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,balanced,0.0521066685517629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.01,0.09785599708557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.01,0.05246719717979431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,balanced,2.0468212763468423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,balanced,0.05305600166320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.01,0.114028799533844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.01,0.05649920105934143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,balanced,0.05414933462937673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.01,0.14011520147323608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.01,0.055827200412750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,power_law_1.01,0.0346560001373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.01,0.18094719648361207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.01,0.059961599111557004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,power_law_1.01,0.03335680067539215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.01,0.06524159908294677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.01,0.2010432004928589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,power_law_1.01,0.03404799997806549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.01,0.06290559768676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,power_law_1.01,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,balanced,2.1512266794840493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.01,0.2639039993286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.01,0.07645440101623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,8,8,power_law_1.2,0.06664320230484008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,balanced,0.0659093310435613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,power_law_1.01,0.03669120073318481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.01,0.2764991998672485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.01,0.08291839957237243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,balanced,0.06836799780527751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,8,8,power_law_1.2,0.058796799182891844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,power_law_1.01,0.038867199420928956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.01,0.09300479888916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.01,0.3691711902618408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,8,8,power_law_1.2,0.05596799850463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,power_law_1.01,0.04535680115222931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.01,0.11208959817886352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.01,0.6001855850219726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,8,8,power_law_1.2,0.05766400098800659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,power_law_1.01,0.04590719938278198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.01,0.1299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.01,0.874015998840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,8,8,power_law_1.2,0.05749120116233826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,power_law_1.01,0.05238400101661682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,8,8,power_law_1.2,0.060115200281143186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.01,0.18995840549468995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.01,0.9160127639770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,power_law_1.01,0.05799040198326111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,8,8,power_law_1.2,0.06596480011940002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.01,0.22590079307556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.01,1.2655360221862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,balanced,0.08619733651479085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,8,8,power_law_1.2,0.06372479796409607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.01,0.3638592004776001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.01,1.9445695877075195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,8,8,power_law_1.2,0.06494719982147217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,power_law_1.01,0.05183359980583191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.01,0.38181118965148925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.01,2.5460416793823244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,8,8,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.01,0.5963520050048828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,power_law_1.01,0.061862397193908694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,8,8,power_law_1.2,0.07672960162162781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.01,0.6866432189941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,balanced,0.09893866380055745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.01,3.4425022125244142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,8,8,power_law_1.2,0.08161280155181885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.01,0.9669952392578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,balanced,0.14103466272354126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,8,8,power_law_1.2,0.10198400020599366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,power_law_1.01,0.06858879923820496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.01,6.665248107910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.01,1.3354944229125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,8,8,power_law_1.2,0.08296959996223449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,balanced,0.16223466396331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,8,8,power_law_1.2,0.10712959766387939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.01,1.7608959197998046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,8,8,power_law_1.2,0.1084671974182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,power_law_1.01,0.07657600045204163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,8,8,power_law_1.2,0.14109439849853517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.01,2.872537612915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,8,8,power_law_1.2,0.17708799839019776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,power_law_1.01,0.08911359906196595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.01,4.6897727966308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,8,8,power_law_1.2,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,power_law_1.01,0.1091007947921753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,8,8,power_law_1.2,0.29922559261322024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,8,8,power_law_1.2,0.291814398765564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,balanced,0.23434666792551676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,8,8,power_law_1.2,0.43445758819580077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,8,8,power_law_1.2,0.5833663940429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,balanced,0.3147626717885335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,power_law_1.01,0.11930880546569825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,8,8,power_law_1.2,0.8640000343322753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,power_law_1.01,0.16037119626998902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,8,8,power_law_1.2,0.8814399719238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,balanced,0.4651679992675781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,8,8,power_law_1.2,1.3583295822143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,8,8,power_law_1.2,1.7556991577148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,power_law_1.01,0.22304000854492187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,balanced,0.6184106667836508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,8,8,power_law_1.2,2.5403263092041017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,8,8,power_law_1.2,3.37918701171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,power_law_1.01,0.2704063892364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,power_law_1.01,0.4600128173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,balanced,0.772869348526001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,8,8,power_law_1.2,7.045664215087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,power_law_1.01,0.48265600204467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,power_law_1.01,0.7548031806945801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,power_law_1.01,1.1047295570373534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,balanced,1.2272160053253174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,power_law_1.01,1.3082624435424806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,power_law_1.01,2.12042236328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,power_law_1.01,2.529804801940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,8,8,power_law_1.2,0.0377344012260437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,power_law_1.01,3.831897735595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,8,8,power_law_1.2,0.04257920086383819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,power_law_1.01,7.712384033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,8,8,power_law_1.2,0.03716480135917664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,balanced,2.3920532862345376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,8,8,power_law_1.2,0.039443200826644896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,8,8,power_law_1.2,0.03959679901599884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,8,8,power_law_1.2,0.045977601408958436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,8,8,power_law_1.2,0.049420800805091855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,8,8,power_law_1.2,0.05106559991836548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,8,8,power_law_1.2,0.05322239995002746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,8,8,power_law_1.2,0.055219197273254396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,8,8,power_law_1.2,0.058220797777175905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,8,8,power_law_1.2,0.06448000073432922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,8,8,power_law_1.2,0.06373760104179382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,8,8,power_law_1.2,0.06350079774856568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,8,8,power_law_1.2,0.0791167974472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,8,8,power_law_1.2,0.0766975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,8,8,power_law_1.2,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,8,8,power_law_1.2,0.12494720220565796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,8,8,power_law_1.2,0.14191999435424804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,8,8,power_law_1.2,0.19993599653244018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,8,8,power_law_1.2,0.25217280387878416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,8,8,power_law_1.2,0.368287992477417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,8,8,power_law_1.2,0.3977024078369141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,8,8,power_law_1.2,0.034867200255393985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,8,8,power_law_1.2,0.640831995010376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,8,8,power_law_1.2,0.6705344200134278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,8,8,power_law_1.2,0.03343999981880188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,8,8,power_law_1.2,1.0198847770690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,8,8,power_law_1.2,0.034016001224517825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,balanced,0.04923200110594431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,8,8,power_law_1.2,1.4180416107177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,8,8,power_law_1.2,0.03615359961986542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,8,8,power_law_1.2,1.7210048675537108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,balanced,0.048986668388048805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,8,8,power_law_1.2,0.036160001158714296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,8,8,power_law_1.2,2.929427146911621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,8,8,power_law_1.2,0.04039680063724518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,balanced,0.05459199845790863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,8,8,power_law_1.2,0.04517120122909546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,balanced,0.05766933163007101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,8,8,power_law_1.2,5.150707244873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,8,8,power_law_1.2,0.04792959988117218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,balanced,0.05770133435726166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,8,8,power_law_1.2,0.05459840297698974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,balanced,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,8,8,power_law_1.2,0.056908798217773435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,balanced,0.05881066620349884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,balanced,0.059338668982187905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,balanced,0.05957333246866862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,8,8,power_law_1.2,0.052134400606155394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,balanced,0.05993066728115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,8,8,power_law_1.2,0.058156800270080564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,8,8,power_law_1.2,0.060844802856445314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,balanced,0.03847466657559077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,balanced,0.06029866635799408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,8,8,power_law_1.2,0.07874559760093688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,balanced,0.06067200005054474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,balanced,0.03868799904982249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,balanced,0.039333333571751915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,balanced,0.0629066675901413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,8,8,power_law_1.2,0.08386560082435608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,balanced,0.04172799984614054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,balanced,0.06968533496061961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,balanced,0.041877334316571556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,8,8,power_law_1.2,0.09060479998588562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,balanced,0.04258666435877482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,balanced,0.07050133248170216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,8,8,power_law_1.2,0.10199040174484253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,balanced,0.043653334180514015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,balanced,0.07461866736412048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,balanced,0.043477331598599754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,balanced,0.08449066678682964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,balanced,0.04804266492525736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,balanced,0.049045334259668984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,balanced,0.09077866872151692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,8,8,power_law_1.2,0.13445760011672975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,balanced,0.046800002455711365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,balanced,0.11428800225257874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,8,8,power_law_1.2,0.16558079719543456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,balanced,0.04846400022506714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,balanced,0.141077329715093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,balanced,0.05027199784914652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,balanced,0.05359466870625814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,balanced,0.03046400099992752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,balanced,0.16472533345222473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,8,8,power_law_1.2,0.2320768117904663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,balanced,0.06126399834950765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,balanced,0.06177066763242086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,balanced,0.029818666477998097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,balanced,0.21342400709788004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,balanced,0.06654933094978333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,8,8,power_law_1.2,0.27083520889282225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,balanced,0.03224000086386999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,balanced,0.07789866626262665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,balanced,0.2968906760215759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,8,8,power_law_1.2,0.47079038619995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.01,0.055827200412750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,balanced,0.08301333089669545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,balanced,0.03513599932193756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,balanced,0.11037866274515788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,8,8,power_law_1.2,0.5142975807189941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.01,0.05457280278205871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,balanced,0.035391998787721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,balanced,0.3276960055033366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,balanced,0.1300373375415802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.01,0.04852479994297028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,balanced,0.037151999771595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,balanced,0.16502933700879416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,8,8,power_law_1.2,0.828486442565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.01,0.05649920105934143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,balanced,0.4827839930852254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.01,0.056959998607635495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,balanced,0.20891733964284262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,8,8,power_law_1.2,1.0626879692077638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,balanced,0.03757333258787791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.01,0.06094080209732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,8,8,power_law_1.2,1.4681471824645995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,balanced,0.2932959993680318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.01,0.0641152024269104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,8,8,power_law_1.2,2.049728012084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,balanced,0.6136800050735474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.01,0.06253439784049988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,balanced,0.35290666421254474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,balanced,0.042410666743914284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.01,0.06589440107345582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.01,0.04038400053977966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,8,8,power_law_1.2,2.483059120178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,balanced,0.043493335445721946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.01,0.07154560089111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,balanced,0.5168533325195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.01,0.040889599919319154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,8,8,power_law_1.2,4.110579299926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,balanced,0.7675893306732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.01,0.07482879757881164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.01,0.03831680119037628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.01,0.07861120104789734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,8,8,power_law_1.2,8.198438262939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,balanced,0.6596266825993856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.01,0.041459199786186215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.01,0.07505279779434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.01,0.042028799653053284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.01,0.08519039750099182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,power_law_1.01,0.031711998581886294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,balanced,0.0415786678592364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.01,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.01,0.09132800102233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,balanced,0.8191573619842529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,balanced,1.2274133364359539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,power_law_1.01,0.0319680005311966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,balanced,0.04363200068473816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.01,0.10624639987945557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.01,0.04888960123062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,power_law_1.01,0.031353598833084105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,balanced,0.044821331898371376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.01,0.11828479766845704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.01,0.0495743989944458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.01,0.14046720266342164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,power_law_1.01,0.034092798829078674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,balanced,0.04673066735267639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.01,0.0513152003288269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.01,0.14622080326080322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,power_law_1.01,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,balanced,1.2831573486328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.01,0.0532800018787384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.01,0.19815679788589477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,power_law_1.01,0.04232319891452789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.01,0.05602560043334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.01,0.24098560810089112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,power_law_1.01,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.01,0.05812479853630066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.01,0.2717952013015747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,balanced,2.4078453381856284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,power_law_1.01,0.04347519874572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.01,0.3767807960510254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.01,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,balanced,0.05564799904823303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.01,0.6970943927764892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.01,0.0567359983921051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,balanced,0.05622933308283488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,power_law_1.01,0.04656639993190766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.01,0.07325440049171447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.01,0.7833280086517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,balanced,0.05930666625499725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,balanced,2.51639461517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,power_law_1.01,0.048089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.01,0.07690879702568054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.01,1.0799103736877442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.01,0.08603519797325135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.01,1.5844096183776855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,balanced,0.0749066670735677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.01,0.11345280408859253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.01,1.4632448196411132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,power_law_1.01,0.05322880148887634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,balanced,0.0804319977760315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.01,0.11512960195541382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.01,3.1501440048217773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,power_law_1.01,0.056480002403259275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.01,0.16540160179138183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,power_law_1.01,0.057683199644088745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.01,7.412544250488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.01,0.21068160533905028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,4,power_law_1.2,0.05514240264892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,power_law_1.01,0.06632320284843445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,balanced,0.10421866178512573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.01,0.27749760150909425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,4,power_law_1.2,0.051622402667999265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.01,0.3348160028457642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,balanced,0.11963199575742085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,4,power_law_1.2,0.05103999972343445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,power_law_1.01,0.07397119998931885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.01,0.45998082160949705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,4,power_law_1.2,0.05600000023841858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,power_law_1.01,0.07502080202102661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,4,power_law_1.2,0.056531202793121335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.01,0.6250239849090576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,power_law_1.01,0.09182720184326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,4,power_law_1.2,0.05866879820823669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.01,1.0705599784851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,4,power_law_1.2,0.05989760160446167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,balanced,0.1807360053062439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,4,power_law_1.2,0.06234880089759827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.01,1.2103039741516113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,power_law_1.01,0.12362240552902222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,4,power_law_1.2,0.0642304003238678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,balanced,0.23409066597620645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.01,1.5159680366516113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,4,power_law_1.2,0.0707264006137848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,power_law_1.01,0.13379199504852296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,4,power_law_1.2,0.07456640005111695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,balanced,0.34671998023986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.01,2.9923776626586913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,4,power_law_1.2,0.0751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,4,power_law_1.2,0.07895680069923401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,power_law_1.01,0.24439680576324463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,4,power_law_1.2,0.09095039963722229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.01,4.316134262084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,balanced,0.4515999952952067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,4,power_law_1.2,0.10151679515838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,power_law_1.01,0.25553920269012453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,4,power_law_1.2,0.10164480209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,balanced,0.6686506271362305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,4,power_law_1.2,0.11818239688873292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,power_law_1.01,0.4505727767944336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,4,power_law_1.2,0.15043840408325196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,4,power_law_1.2,0.1566975951194763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,power_law_1.01,0.5533504009246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,4,power_law_1.2,0.21400320529937744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,balanced,0.8836692969004313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,power_law_1.01,0.8784064292907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,4,power_law_1.2,0.27908480167388916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,power_law_1.01,0.961184024810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,4,power_law_1.2,0.3021631956100464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,power_law_1.01,1.5300864219665526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,4,power_law_1.2,0.4538879871368408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,balanced,1.1062933603922527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,power_law_1.01,2.052524757385254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,4,power_law_1.2,0.6360000133514404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,4,power_law_1.2,0.7525760173797608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,power_law_1.01,2.6848447799682615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,4,power_law_1.2,1.3052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,power_law_1.01,3.7429569244384764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,4,power_law_1.2,1.567084789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,balanced,1.7537706693013508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,4,power_law_1.2,1.945471954345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,power_law_1.01,8.720780944824218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,4,power_law_1.2,3.7709312438964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,4,power_law_1.2,4.592588806152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,balanced,3.468970616658529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,4,power_law_1.2,0.03989120125770569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,4,power_law_1.2,0.040659201145172116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,4,power_law_1.2,0.039443200826644896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,4,power_law_1.2,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,4,power_law_1.2,0.04200319945812225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,4,power_law_1.2,0.04618239998817444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,4,power_law_1.2,0.04601599872112274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,4,power_law_1.2,0.0502016007900238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,4,power_law_1.2,0.05135359764099121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,4,power_law_1.2,0.05110399723052979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,4,power_law_1.2,0.05598719716072083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,4,power_law_1.2,0.05667200088500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,4,power_law_1.2,0.05916799902915955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,4,power_law_1.2,0.06313599944114685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,balanced,0.03965333352486292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,4,power_law_1.2,0.07381759881973267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,4,power_law_1.2,0.08394880294799804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,balanced,0.04422399898370107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,balanced,0.05479466418425242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,4,power_law_1.2,0.08782079815864563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,4,power_law_1.2,0.032332798838615416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,balanced,0.056885331869125366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,4,power_law_1.2,0.10958720445632934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,balanced,0.0569706658522288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,4,power_law_1.2,0.0321152001619339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,4,power_law_1.2,0.13741439580917358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,balanced,0.05862399935722351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,4,power_law_1.2,0.03224320113658905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,4,power_law_1.2,0.1857792019844055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,balanced,0.05805333455403646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,4,power_law_1.2,0.03493120074272156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,4,power_law_1.2,0.18721920251846313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,balanced,0.03515200068553289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,balanced,0.057775999108950295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,4,power_law_1.2,0.03330560028553009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,4,power_law_1.2,0.2954495906829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,balanced,0.036271999279658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,balanced,0.05970133344332377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,4,power_law_1.2,0.040908798575401306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,balanced,0.04051200052102407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,balanced,0.059952000776926674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,4,power_law_1.2,0.40991997718811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,4,power_law_1.2,0.04338560104370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,balanced,0.04223999877770742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,balanced,0.06158400078614553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,4,power_law_1.2,0.04508799910545349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,balanced,0.04333333174387614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,4,power_law_1.2,0.5929791927337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,balanced,0.0622026671965917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,balanced,0.043738668163617454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,balanced,0.06258133550484975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,4,power_law_1.2,0.04593920111656189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,4,power_law_1.2,0.6708735942840576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,balanced,0.04557866851488749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,balanced,0.06605333089828491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,4,power_law_1.2,0.04700160026550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,balanced,0.044821331898371376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,balanced,0.07172266642252605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,4,power_law_1.2,1.1076095581054688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,balanced,0.04938133557637533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,balanced,0.07299200197060902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,4,power_law_1.2,1.2231807708740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,balanced,0.07852800190448761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,balanced,0.05045866469542185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,4,power_law_1.2,0.05400959849357605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,balanced,0.0934986670811971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,balanced,0.047498668233553566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,4,power_law_1.2,1.757766342163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,4,power_law_1.2,0.05671679973602295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,balanced,0.10371200243631999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,balanced,0.0503359983364741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,4,power_law_1.2,0.059622400999069215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,balanced,0.12302933136622111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,4,power_law_1.2,2.8535104751586915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,balanced,0.05150400102138519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,4,power_law_1.2,0.07561600208282471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,balanced,0.1527786652247111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,4,power_law_1.2,4.5950462341308596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,balanced,0.19220266739527384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,4,power_law_1.2,0.08555520176887513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,balanced,0.26366400718688965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,balanced,0.029546665648619335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,balanced,0.06344533463319142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,4,power_law_1.2,0.08770560026168824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,balanced,0.029839999973773956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,balanced,0.3646453221638997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,balanced,0.06518400212128957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,4,power_law_1.2,0.10164480209350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,balanced,0.03449599941571554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,balanced,0.036992001036802925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,balanced,0.07044266661008199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,balanced,0.41361598173777264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,4,power_law_1.2,0.14816000461578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,balanced,0.03809600075085958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,4,power_law_1.2,0.14549119472503663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,balanced,0.08504533767700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,balanced,0.03997866561015447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,balanced,0.5883413155873617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,balanced,0.09515733520189922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,4,power_law_1.2,0.24926719665527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,balanced,0.04248533149560293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,4,power_law_1.2,0.28370559215545654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,balanced,0.11689066886901855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,balanced,0.041562666495641075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,balanced,0.7763360341389974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.01,0.044512000679969785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,balanced,0.13622400164604187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,4,power_law_1.2,0.424179220199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.01,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,balanced,0.044624000787734985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,4,power_law_1.2,0.5927487850189209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,balanced,0.20211732387542725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,4,power_law_1.2,0.9470784187316894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.01,0.04496639966964722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,balanced,0.04609066744645437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,4,power_law_1.2,1.2622655868530273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,balanced,0.9622720082600912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.01,0.05681279897689819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,balanced,0.24659732977549234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,4,power_law_1.2,1.6463552474975587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.01,0.05731199979782105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,4,power_law_1.2,2.3870208740234373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.01,0.05804799795150757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,balanced,0.35507198174794513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,4,power_law_1.2,3.2886337280273437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.01,0.057631999254226685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,4,power_law_1.2,5.5876415252685545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.01,0.06385279893875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,balanced,0.04611733555793762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,balanced,0.42563732465108234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.01,0.035545599460601804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,balanced,1.5532959302266438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.01,0.06314240097999572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,balanced,0.04933866858482361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,4,power_law_1.2,10.451897430419923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.01,0.03616639971733093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.01,0.0635968029499054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,balanced,0.05119466781616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,balanced,0.6165813207626343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.01,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.01,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,balanced,0.0518506666024526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,power_law_1.01,0.03059839904308319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.01,0.06895999908447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.01,0.04021120071411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,balanced,0.8105440139770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,power_law_1.01,0.03075839877128601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.01,0.07132800221443177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.01,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.01,0.0717311978340149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.01,0.08923519849777221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,power_law_1.01,0.03671680092811584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,balanced,0.06317866841952006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.01,0.045151999592781066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,balanced,1.00326935450236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.01,0.09902080297470092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,power_law_1.01,0.03804160058498383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,balanced,3.0061972935994468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,balanced,0.06613866488138835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.01,0.04705919921398163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.01,0.09562879800796509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,power_law_1.01,0.04142720103263855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,balanced,0.07116800049940745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.01,0.11752320528030395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.01,0.04857600033283234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,power_law_1.01,0.043558400869369504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.01,0.11940480470657348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,power_law_1.01,0.04619520008563995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.01,0.0489984005689621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,balanced,1.6176053682963054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.01,0.17081600427627563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.01,0.051526397466659546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,balanced,0.09274666508038838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.01,0.20373120307922363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,power_law_1.01,0.04827519953250885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.01,0.05406079888343811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.01,0.29631359577178956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,balanced,0.10162132978439331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,power_law_1.01,0.04835200011730194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.01,0.3463040113449097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.01,0.05675519704818725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.01,0.5381760120391845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.01,0.060108798742294314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.01,0.7037055969238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,power_law_1.01,0.05455999970436096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.01,0.06997759938240052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,power_law_1.01,0.05794559717178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.01,0.982483196258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.01,0.07898240089416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,balanced,0.14114666978518167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,power_law_1.01,0.0630400002002716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,balanced,3.26580810546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.01,0.07989760041236878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.01,1.1450816154479981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.01,0.09720960259437561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.01,1.3622336387634277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,balanced,0.18827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,power_law_1.01,0.06829439997673034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.01,0.11478400230407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.01,2.3337919235229494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,balanced,0.28566400210062665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.01,0.14162559509277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.01,4.45970573425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,balanced,0.3590453465779622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,power_law_1.01,0.07905920147895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.01,0.19802240133285523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,power_law_1.01,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,balanced,0.5238346656163534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.01,0.27525761127471926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,power_law_1.01,0.09717119932174682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.01,0.3148799896240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,balanced,0.6854720115661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.01,0.5081215858459472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,power_law_1.01,0.12164479494094849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.01,0.5699391841888428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,power_law_1.01,0.13325439691543578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,balanced,1.013002634048462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.01,0.8315008163452149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.01,1.1887807846069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,power_law_1.01,0.19155839681625367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,balanced,1.3436212539672852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.01,1.4254591941833497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,power_law_1.01,0.27000319957733154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.01,2.519584083557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,power_law_1.01,0.4140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,balanced,1.6796053250630696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.01,4.613491058349609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,power_law_1.01,0.5009727954864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,power_law_1.01,0.8293888092041015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,2,power_law_1.2,0.043782401084899905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,power_law_1.01,1.0262975692749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,2,power_law_1.2,0.044607999920845035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,power_law_1.01,1.4928447723388671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,2,power_law_1.2,0.0448063999414444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,balanced,2.6678454081217446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,power_law_1.01,2.110483169555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,2,power_law_1.2,0.056953597068786624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,power_law_1.01,2.7739391326904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,2,power_law_1.2,0.056959998607635495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,2,power_law_1.2,0.05749760270118713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,power_law_1.01,3.677260971069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,2,power_law_1.2,0.05923839807510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,2,power_law_1.2,0.058790397644042966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,power_law_1.01,9.318067169189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,2,power_law_1.2,0.06292480230331421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,2,power_law_1.2,0.06461439728736877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,balanced,5.298368136088054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,2,power_law_1.2,0.06435199975967407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,2,power_law_1.2,0.07066879868507385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,2,power_law_1.2,0.07284479737281799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,2,power_law_1.2,0.07136639952659607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,2,power_law_1.2,0.09397119879722596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,2,power_law_1.2,0.09823359847068787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,2,power_law_1.2,0.09341440200805665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,2,power_law_1.2,0.13164160251617432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,2,power_law_1.2,0.13226239681243895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,2,power_law_1.2,0.16699520349502564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,2,power_law_1.2,0.18931200504302978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,2,power_law_1.2,0.2865407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,2,power_law_1.2,0.3920831918716431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,2,power_law_1.2,0.03850879967212677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,2,power_law_1.2,0.565388822555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,2,power_law_1.2,0.03720960021018982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,2,power_law_1.2,0.6712704181671143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,2,power_law_1.2,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,2,power_law_1.2,0.9350015640258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,2,power_law_1.2,0.04226559996604919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,2,power_law_1.2,1.289900779724121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,2,power_law_1.2,0.043705600500106814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,2,power_law_1.2,1.6613119125366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,2,power_law_1.2,0.04595839977264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,2,power_law_1.2,0.0469760000705719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,2,power_law_1.2,0.04787200093269348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,2,power_law_1.2,2.225984001159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,2,power_law_1.2,0.05071359872817993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,2,power_law_1.2,4.553740692138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,2,power_law_1.2,0.030656000971794127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,2,power_law_1.2,0.05082880258560181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,2,power_law_1.2,0.05111680030822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,2,power_law_1.2,0.031065601110458373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,2,power_law_1.2,0.03264000117778778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,2,power_law_1.2,0.05820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,2,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,2,power_law_1.2,0.06088320016860962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,2,power_law_1.2,0.03849599957466125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,2,power_law_1.2,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,2,power_law_1.2,0.04224640130996704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,2,power_law_1.2,0.04405120015144348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,2,power_law_1.2,0.06962559819221496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,2,power_law_1.2,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,2,power_law_1.2,0.0784704029560089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,2,power_law_1.2,0.04787200093269348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,2,power_law_1.2,0.07854080200195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,2,power_law_1.2,0.04764800071716309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,2,power_law_1.2,0.0998528003692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,2,power_law_1.2,0.1182528018951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,2,power_law_1.2,0.05616639852523804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,2,power_law_1.2,0.14908159971237184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,2,power_law_1.2,0.05985280275344849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,2,power_law_1.2,0.1950592041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,2,power_law_1.2,0.06167680025100708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,2,power_law_1.2,0.2616192102432251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,2,power_law_1.2,0.06915839910507202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,2,power_law_1.2,0.32280960083007815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,2,power_law_1.2,0.5289984226226807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,2,power_law_1.2,0.0789247989654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,2,power_law_1.2,0.08517119884490967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,2,power_law_1.2,0.6615551948547364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,2,power_law_1.2,0.09380480051040649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,2,power_law_1.2,0.90829439163208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,2,power_law_1.2,0.1278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,2,power_law_1.2,1.1666560173034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,2,power_law_1.2,0.13448959589004517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,2,power_law_1.2,1.3269439697265626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,2,power_law_1.2,2.067193603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,2,power_law_1.2,0.20612480640411376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,2,power_law_1.2,4.442476654052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,2,power_law_1.2,0.3017791986465454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,2,power_law_1.2,0.46223998069763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,2,power_law_1.2,0.4987135887145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,2,power_law_1.2,0.7886271953582764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,2,power_law_1.2,1.060326385498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,2,power_law_1.2,1.560371208190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,balanced,0.19925334056218466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,2,power_law_1.2,1.8567935943603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,balanced,0.19604800144831339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,2,power_law_1.2,3.035686492919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,balanced,0.1930239995320638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,balanced,0.12071999907493591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,2,power_law_1.2,4.578540802001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,balanced,0.20139199495315552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,balanced,0.34618135293324787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,balanced,0.11729600032170613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,balanced,0.657807985941569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,2,power_law_1.2,9.650476837158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,balanced,0.12085866928100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,balanced,0.6923466523488363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,balanced,0.1239359974861145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,balanced,0.20880534251530966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,balanced,0.6697813669840494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,balanced,0.3691946665445964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,balanced,0.6454613208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,balanced,0.3633386691411336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,balanced,0.6591840187708536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,balanced,0.3638506730397542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,balanced,0.658181349436442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,balanced,0.36049067974090576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,balanced,0.6866719722747803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,balanced,0.37565334637959796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,balanced,0.6973439852396647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,balanced,0.3538186550140381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,balanced,0.6423199971516927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,balanced,0.36799999078114826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,balanced,0.6525386571884155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,balanced,0.37084798018137616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,balanced,0.35303465525309247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,balanced,0.6292479832967123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,balanced,0.3765386740366618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,balanced,0.6630026499430338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,balanced,0.36753066380818683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,balanced,0.6491573254267374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,balanced,0.3616746664047241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,balanced,0.5908693472544352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,balanced,0.36849598089853924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,balanced,0.6097066799799601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,balanced,0.3698720137278239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,balanced,0.05663466453552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,balanced,0.5862293243408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,balanced,0.3784960110982259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,balanced,0.054341331124305725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,balanced,0.05806933343410492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,balanced,0.5287786722183228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,balanced,0.3673706849416097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.6655424118041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.3624896049499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,balanced,0.07879466811815898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.6621823787689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.36204800605773924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,balanced,0.41619733969370526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,balanced,0.3725920120875041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,balanced,0.10215466221173604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.58853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.3221184015274048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,balanced,0.10288533568382263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.3429375886917114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,balanced,0.1039626697699229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.23067519664764405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,balanced,0.3338559865951538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,balanced,0.10428800185521443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.5180992126464844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.29575679302215574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,balanced,1.0145280361175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,balanced,0.10460799932479858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.3162048101425171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.597977590560913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,balanced,0.10647466778755188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.35484158992767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.6172544002532959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,balanced,0.6706773440043131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,balanced,0.1079253355662028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.5910975933074951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.32981119155883787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,balanced,0.10873066385587056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,balanced,0.7989652951558431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.5780928134918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.3468224048614502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,balanced,0.11027200023333232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.5963647842407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,balanced,0.11571733156840007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,balanced,0.5981599887212118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.3598207950592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.6558464050292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,balanced,0.1162559986114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.33018879890441893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.6394559860229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,balanced,0.12107732892036438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.358022403717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.6467135906219482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,balanced,1.115616003672282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.34172160625457765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.5940608024597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.339084792137146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.6117248058319091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,balanced,0.13010133306185404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,balanced,0.8706719875335693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.3276031970977783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.6139840126037598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.3308160066604614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.5410560131072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.3390336036682129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.6253824234008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.42559361457824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.7094783782958984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,balanced,1.5015145937601726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.5185023784637451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.9269696235656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,balanced,0.13994666934013367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.5528831958770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.01,0.9843008041381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,balanced,0.15684266885121664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,power_law_1.01,0.10131839513778687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.7451712131500244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,balanced,1.1483519872029622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.01,1.306272029876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.9428544044494629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,power_law_1.01,0.09716479778289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,balanced,0.17014400164286295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.01,1.6220096588134765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,1.4087424278259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.01,2.350912094116211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,power_law_1.01,0.0752128005027771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,1.920966339111328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,power_law_1.01,0.07796480059623719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.01,2.933401679992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,power_law_1.01,0.08196480274200439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,2.4274175643920897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.01,4.887200164794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,balanced,1.8694720268249512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,power_law_1.01,0.09225599765777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,balanced,0.20171199242273966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,3.209209442138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.01,6.504582214355469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,power_law_1.01,0.10089600086212158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.01,4.128121566772461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,power_law_1.01,0.09882879853248597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,balanced,1.42575470606486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.01,8.49130859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,balanced,0.22988265752792358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.01,7.059705352783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,power_law_1.01,0.10227199792861938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,power_law_1.01,0.10300159454345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.01,15.105459594726563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,power_law_1.01,0.10872960090637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.01,17.64849853515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,balanced,0.3046986659367879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,power_law_1.01,0.10956159830093384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,power_law_1.01,0.11143679618835449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.01,31.493240356445312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,power_law_1.01,0.12129919528961182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,power_law_1.01,0.13217920064926147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,balanced,0.3635093371073405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,power_law_1.01,0.13866879940032958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.6575488090515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,balanced,3.1721814473470054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,power_law_1.01,0.16619520187377929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.6492095947265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.3150719881057739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,power_law_1.01,0.1805567979812622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,balanced,2.3437280654907227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.403110408782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,balanced,0.5235733191172282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.40307202339172366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.01,0.17793279886245728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.46991357803344724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.01,0.24595839977264405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.6754176139831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.01,0.27022080421447753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.6195583820343018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.6054143905639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.01,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.5640192031860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.01,0.4520895957946777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.5888703823089599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,balanced,0.6848053137461344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.5568319797515869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.01,0.6248767852783204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.6331711769104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.01,0.7650879859924317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.3741312026977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.6298240184783935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.01,1.2370752334594726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.3565632104873657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.5790592193603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.01,1.6039936065673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.1780608057975769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.5547327995300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.23375999927520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,power_law_1.01,2.069875144958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.5347904205322266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.26375679969787597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.7744639873504638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.01,3.1133760452270507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.2851263999938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,balanced,0.8584106763203939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.9326144218444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.3216192007064819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,64,power_law_1.2,1.1567423820495606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.01,7.147571563720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.3540735960006714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,64,power_law_1.2,1.2545727729797362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.310918402671814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.3612096071243286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,64,power_law_1.2,1.7330368041992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,balanced,6.663536071777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.3074559926986694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,64,power_law_1.2,2.4163455963134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.31300480365753175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.31816959381103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,64,power_law_1.2,3.137676811218262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,balanced,4.849247932434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.3517823934555054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,64,power_law_1.2,4.442521667480468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.31813759803771974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.33885440826416013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,64,power_law_1.2,7.038995361328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.29386239051818847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,64,power_law_1.2,10.60268783569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.4652544021606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,balanced,1.3473866780598958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.44089598655700685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,64,power_law_1.2,12.374610900878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.5699776172637939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.7322879791259765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,64,power_law_1.2,23.75191650390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,0.9403136253356934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,1.4017279624938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,1.9963264465332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,2.5735679626464845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,64,power_law_1.2,42.02879943847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,3.705049514770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,4.6309761047363285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,64,power_law_1.2,5.776979064941406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,64,power_law_1.2,10.317164611816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,64,power_law_1.2,25.75374755859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,balanced,2.7185118993123374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,64,power_law_1.2,0.09973120093345642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,64,power_law_1.2,0.09507840275764465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,64,power_law_1.2,0.06728320121765137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,balanced,0.07229333122571309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,64,power_law_1.2,0.08152959942817688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,balanced,0.06759466727574666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,64,power_law_1.2,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,balanced,0.062234664956728615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,64,power_law_1.2,0.08727679848670959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,balanced,0.07541333138942719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,64,power_law_1.2,0.10280319452285766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,balanced,0.10564800103505452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,64,power_law_1.2,0.10181759595870972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,balanced,0.1607093314329783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,64,power_law_1.2,0.09435520172119141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,balanced,0.16082666317621866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,64,power_law_1.2,0.10772479772567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,balanced,0.16300800442695618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,64,power_law_1.2,0.1030784010887146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,balanced,0.1622880001862844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,balanced,0.16332800189654031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,64,power_law_1.2,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,balanced,0.16059199968973795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,64,power_law_1.2,0.11415679454803467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,balanced,0.16166933377583823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,64,power_law_1.2,0.1227455973625183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,balanced,0.16216533382733664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,64,power_law_1.2,0.14458240270614625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,balanced,0.16470932960510254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,64,power_law_1.2,0.14862719774246216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,balanced,0.169978658358256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,64,power_law_1.2,0.18210560083389282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,balanced,0.17013333241144815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,balanced,0.1792959968249003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,balanced,0.18571732441584268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,64,power_law_1.2,0.19683200120925903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,balanced,0.194432000319163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,balanced,0.20811732610066733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.2,0.19115519523620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,balanced,0.06003733476003011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.2,0.2592319965362549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,balanced,0.22741333643595377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.2,0.34812159538269044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,balanced,0.0505973349014918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,balanced,0.050800000627835594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,balanced,0.2505653301874797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.2,0.4294591903686523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,balanced,0.05735466877619425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,balanced,0.07964799801508586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.2,0.6238848209381104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,balanced,0.1060693363348643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,balanced,0.2807893355687459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.2,1.084819221496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,balanced,0.10852266351381938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,balanced,0.10857066512107849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.2,1.175443172454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,balanced,0.10946666200955708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,balanced,0.10994666814804077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.2,1.7331008911132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,balanced,0.34171199798583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.01,0.1701632022857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,balanced,0.11166399717330933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.2,2.37457275390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.01,0.14943360090255736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,balanced,0.11286399761835735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.01,0.11742719411849975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,balanced,0.11525866389274597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,64,power_law_1.2,2.872665596008301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.01,0.08812159895896912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,balanced,0.11680000027020772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.01,0.10952320098876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,balanced,0.12332266569137573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,balanced,0.40053868293762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.01,0.1195072054862976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.2,5.817203140258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,balanced,0.12556800246238708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.01,0.14878720045089722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,balanced,0.13058132926623026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.01,0.14841599464416505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,balanced,0.04599999884764353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,balanced,0.14121599992116293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.01,0.15038080215454103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.2,12.443590545654297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,balanced,0.04669333497683207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.01,0.15438079833984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,balanced,0.153029332558314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,balanced,0.04667733112970988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.01,0.14286719560623168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,balanced,0.05825066566467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,balanced,0.5507520039876302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.01,0.14132479429244996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,balanced,0.17575466632843018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,balanced,0.07935999830563863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.01,0.1603327989578247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,balanced,0.10222933689753215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.01,0.16868480443954467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,balanced,0.19833600521087646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.01,0.10730880498886108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,balanced,0.10451199611028035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.01,0.1684928059577942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,balanced,0.10479467113812764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.01,0.09756159782409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,balanced,0.23696533838907877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.01,0.8851136207580567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,balanced,0.10526399811108907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.01,0.0838271975517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.01,0.18673280477523804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,balanced,0.10611733794212341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.01,0.07013760209083557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,balanced,0.10774399836858113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.01,0.23138558864593506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,balanced,0.2799839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,balanced,0.6636000076929728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.01,0.08677759766578674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,balanced,0.10893332958221436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.01,0.2094912052154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,balanced,0.11034666498502095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.01,0.09191679954528809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.01,0.2682176113128662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,balanced,0.11245333154996236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.01,0.09687039852142335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,balanced,0.3627413511276245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.01,0.27487359046936033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,balanced,0.11917866269747417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.01,0.1028223991394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.01,0.34922239780426023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,balanced,0.11966400345166524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.01,0.10165760517120362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.01,0.44022397994995116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,balanced,0.12422933181126912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.01,0.10357120037078857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.01,0.5673088073730469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.01,0.10889600515365601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,balanced,0.44458667437235516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.01,0.7530303955078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.01,0.11023999452590942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,power_law_1.01,0.11290240287780762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.01,0.9856639862060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,balanced,0.8438826402028402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.01,0.11134079694747925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,power_law_1.01,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.01,0.11191040277481079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.01,1.2901247978210448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,balanced,0.13540800412495932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,power_law_1.01,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,32,power_law_1.2,0.17049599885940553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.01,0.12520320415496827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.01,1.5781760215759277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,power_law_1.01,0.0668287992477417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.01,0.13527679443359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,32,power_law_1.2,0.15009280443191528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,balanced,0.6289973258972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,32,power_law_1.2,0.0749504029750824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.01,2.249510383605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.01,0.13747199773788452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,power_law_1.01,0.08677120208740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,32,power_law_1.2,0.10026240348815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.01,0.15715839862823486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,power_law_1.01,0.08250880241394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,32,power_law_1.2,0.09841920137405395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.01,5.056281661987304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.01,0.1694591999053955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,power_law_1.01,0.09572479724884034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,32,power_law_1.2,0.11890560388565063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,32,power_law_1.2,0.152019202709198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.01,0.21301119327545165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,power_law_1.01,0.09921919703483581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,balanced,0.1469493309656779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,32,power_law_1.2,0.14401919841766359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.01,0.22671360969543458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,power_law_1.01,0.09943040013313294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,32,power_law_1.2,0.15279359817504884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,balanced,0.164901336034139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.01,0.3178112030029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,power_law_1.01,0.09996160268783569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,32,power_law_1.2,0.15733760595321655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,balanced,0.7906986872355143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.01,0.3508863925933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,32,power_law_1.2,0.14897279739379882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,balanced,0.1824480096499125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,power_law_1.01,0.10168960094451904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,32,power_law_1.2,0.15767680406570433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.01,0.4815552234649658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,power_law_1.01,0.10655360221862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,balanced,1.217098633448283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,32,power_law_1.2,0.16759040355682372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.01,0.6332032203674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,power_law_1.01,0.11603200435638428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,32,power_law_1.2,0.1538879990577698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.01,0.9526016235351562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,32,power_law_1.2,1.117587184906006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,power_law_1.01,0.11773439645767211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,32,power_law_1.2,1.135103988647461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.01,1.1561599731445313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,balanced,0.22176533937454224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,power_law_1.01,0.13140480518341063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,32,power_law_1.2,0.2059391975402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.01,1.4045568466186524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,32,power_law_1.2,0.24682879447937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,power_law_1.01,0.13615360260009765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,32,power_law_1.2,0.23021440505981444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,balanced,0.2553973396619161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,power_law_1.01,0.15229439735412598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.01,2.15548152923584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,32,power_law_1.2,0.2906559944152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,balanced,0.990074634552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,32,power_law_1.2,0.34165120124816895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.01,4.362566375732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,32,power_law_1.2,0.4414527893066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,power_law_1.01,0.17521920204162597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,32,power_law_1.2,0.512940788269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,balanced,0.35552533467610675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,32,power_law_1.2,0.6518464088439941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,32,power_law_1.2,0.8634048461914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,power_law_1.01,0.17935999631881713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,32,power_law_1.2,1.4165056228637696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,power_law_1.01,0.2302016019821167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,balanced,0.4399413267771403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,32,power_law_1.2,1.6922111511230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,power_law_1.01,0.25768959522247314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,32,power_law_1.2,1.8740671157836915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,32,power_law_1.2,3.211276626586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,power_law_1.01,0.37420799732208254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,power_law_1.01,0.43848958015441897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,power_law_1.2,7.222259521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,power_law_1.01,0.5913919925689697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,power_law_1.01,0.8283840179443359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,balanced,1.5037546157836914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,balanced,0.6323893467585245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,power_law_1.01,1.2643712043762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,power_law_1.01,1.829587173461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,power_law_1.01,1.952396774291992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,32,balanced,2.4779626528422036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,power_law_1.01,3.1710208892822265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,power_law_1.01,6.4739837646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,balanced,0.8233813444773356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,balanced,1.0123786926269531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,32,power_law_1.2,0.10802559852600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,32,power_law_1.2,0.09938560128211975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,32,power_law_1.2,0.062457597255706786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,32,power_law_1.2,0.06684160232543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,32,power_law_1.2,0.07801600098609925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,32,power_law_1.2,0.0885312020778656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,32,power_law_1.2,0.10311039686203002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,balanced,2.9713493982950845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,32,power_law_1.2,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,32,power_law_1.2,0.10268160104751586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,balanced,1.5979199409484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,32,power_law_1.2,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,32,power_law_1.2,0.10168960094451904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,32,power_law_1.2,0.10861439704895019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,32,power_law_1.2,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,32,power_law_1.2,0.12127360105514526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,32,power_law_1.2,0.12885760068893432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,32,power_law_1.2,0.13767679929733276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,32,power_law_1.2,0.14358400106430053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,32,power_law_1.2,0.16959359645843505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,32,power_law_1.2,0.18609280586242677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,32,power_law_1.2,0.23084800243377684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,32,power_law_1.2,0.25194880962371824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,32,power_law_1.2,0.34143359661102296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,32,power_law_1.2,0.42500481605529783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,32,power_law_1.2,0.5737792015075683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,32,power_law_1.2,0.7047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,32,power_law_1.2,1.2045184135437013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,32,power_law_1.2,1.5780415534973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,32,power_law_1.2,2.161235237121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,32,power_law_1.2,0.10369919538497925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,32,power_law_1.2,3.0667648315429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,32,power_law_1.2,0.09943680167198181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,32,power_law_1.2,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,balanced,3.2197386423746743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,32,power_law_1.2,6.82336654663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,32,power_law_1.2,0.07417600154876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,32,power_law_1.2,0.07653759717941284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,32,power_law_1.2,0.08140159845352173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,32,power_law_1.2,0.09752320051193238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,32,power_law_1.2,0.0943615972995758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,32,power_law_1.2,0.0980351984500885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,32,power_law_1.2,0.10451840162277222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,32,power_law_1.2,0.10595200061798096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,balanced,0.05842133363087972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,32,power_law_1.2,0.10885119438171387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,32,power_law_1.2,0.11095679998397827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,balanced,0.05638933181762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,balanced,0.06172266602516174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,32,power_law_1.2,0.12233599424362182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,balanced,0.07548266649246216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,balanced,0.10506133238474528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,32,power_law_1.2,0.13139840364456176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,balanced,0.1592639982700348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,32,power_law_1.2,0.14149119853973388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,balanced,0.16171200076738992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,balanced,0.048911998669306435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,32,power_law_1.2,0.16763520240783691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,balanced,0.15896000464757284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,balanced,0.15944000085194907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,balanced,0.04978133241335551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,balanced,0.15985600153605142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,balanced,0.05023466547330221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,balanced,0.16169599692026773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,32,power_law_1.2,0.18322559595108032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,balanced,0.16234133640925089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,balanced,0.07762666543324788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,balanced,0.10735467076301575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,balanced,0.16386666893959045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,32,power_law_1.2,0.18746880292892457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,balanced,0.11060266693433125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,balanced,0.16536532839139303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,balanced,0.11037866274515788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,32,power_law_1.2,0.2430272102355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,balanced,0.17108800013860068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,balanced,0.11133866508801778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,32,power_law_1.2,0.29553918838500975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,balanced,0.17223999897638956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.01,0.11301120519638061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,balanced,0.11358400185902913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,balanced,0.18178133169809976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.01,0.15525120496749878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,balanced,0.11408000191052754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,32,power_law_1.2,0.40320000648498533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.01,0.08325120210647582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,balanced,0.1902559995651245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,balanced,0.11533332864443462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,32,power_law_1.2,0.5051136016845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.01,0.07952640056610108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,balanced,0.20062933365503946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,balanced,0.11821333567301433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.01,0.09628159999847412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,32,power_law_1.2,0.7579328060150147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,balanced,0.04655466477076212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.01,0.11409280300140381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,balanced,0.11942399541536967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,balanced,0.2213653326034546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,32,power_law_1.2,1.1408448219299316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,balanced,0.04706133405367533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.01,0.13390719890594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,balanced,0.048528000712394714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,balanced,0.12632532914479574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,balanced,0.06278933087984721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,balanced,0.24203733603159586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,balanced,0.12757866581281027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.01,0.13709440231323242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,balanced,0.0769760012626648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,32,power_law_1.2,1.8139904022216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,balanced,0.10457066694895427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,balanced,0.13455466429392496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.01,0.13968000411987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,32,power_law_1.2,1.9421951293945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,balanced,0.1071573297182719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,balanced,0.2712480028470357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,balanced,0.14739200472831726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.01,0.14075520038604736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,balanced,0.10760533809661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,32,power_law_1.2,3.1756799697875975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,balanced,0.10827199618021648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,balanced,0.16364266475041708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,balanced,0.10876799623171489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.01,0.1470080018043518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,balanced,0.30984532833099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,balanced,0.1109386682510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,32,power_law_1.2,5.008633422851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,balanced,0.18548800547917685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,balanced,0.11246400078137715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.01,0.15418879985809325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,balanced,0.11382933457692464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,balanced,0.2119093338648478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,32,power_law_1.2,10.084518432617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,balanced,0.11590933799743652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.01,0.15420160293579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,balanced,0.37589867909749347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,balanced,0.12292266885439555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.01,0.16069120168685913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,balanced,0.12501866618792215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,balanced,0.2546079953511556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,balanced,0.13074666261672974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.01,0.16984959840774536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.01,0.07651200294494628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.01,0.6517632007598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,balanced,0.30592532952626544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,balanced,0.46693865458170575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.01,0.10110080242156982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.01,0.19608960151672364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.01,0.06803200244903565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.01,0.2096127986907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,balanced,0.14546133081118265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.01,0.06739839911460876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.01,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,balanced,0.39479466279347736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.01,0.2250368118286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.01,0.07975680232048035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.01,0.26714239120483396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.01,0.09571200013160705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.01,0.2763583898544312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,balanced,0.6429866552352905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.01,0.09511680006980897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.01,0.10157439708709717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.01,0.34965760707855226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,balanced,0.5044159889221191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.01,0.10213760137557984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.01,0.41680002212524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,balanced,0.16545066237449646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.01,0.10496000051498414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.01,0.511571216583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.01,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,balanced,0.1906933387120565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.01,0.6999743938446045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.01,0.11110399961471558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.01,0.9669759750366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.01,0.11963520050048829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,balanced,0.2105706731478373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.01,1.1965951919555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.01,0.12465920448303222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,balanced,0.7076853116353353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.01,1.5349632263183595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,balanced,0.8035786946614584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.01,0.12700799703598023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,balanced,0.2733493248621623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.01,0.13657599687576294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.01,2.1182655334472655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.01,0.15479040145874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.01,0.17593599557876588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.01,5.016729736328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,balanced,0.33108800649642944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.01,0.20597760677337645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.01,0.24773120880126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.01,0.3077440023422241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.01,0.3599103927612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,balanced,0.4742186864217122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,balanced,0.8708373705546061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.01,0.5127935886383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.01,0.6340672016143799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,balanced,1.0190186500549316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.01,0.9487744331359863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.01,1.2621631622314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,balanced,0.5797173182169596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.01,1.4934080123901368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.01,2.1614400863647463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.01,4.733868789672852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,balanced,1.112170696258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,balanced,0.8388426303863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,16,power_law_1.2,0.11300480365753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,16,power_law_1.2,0.15337599515914918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,power_law_1.01,0.07835519909858704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,16,power_law_1.2,0.06480640172958374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,balanced,1.4393067359924316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,16,power_law_1.2,0.08815360069274902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,power_law_1.01,0.10625920295715333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,16,power_law_1.2,0.08917120099067688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,balanced,1.092725356419881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,power_law_1.01,0.07191680073738098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,16,power_law_1.2,0.10684800148010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,power_law_1.01,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,16,power_law_1.2,0.1290112018585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,power_law_1.01,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,16,power_law_1.2,0.14266879558563234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,power_law_1.01,0.08762879967689514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,16,power_law_1.2,0.13911039829254152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,power_law_1.01,0.0976960003376007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,power_law_1.01,0.09834880232810975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,16,power_law_1.2,0.1376960039138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,balanced,1.6765546798706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,power_law_1.01,0.10290559530258178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,16,power_law_1.2,0.14780160188674926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,power_law_1.01,0.10392960309982299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,16,power_law_1.2,0.14594559669494628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,power_law_1.01,0.10444799661636353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,power_law_1.01,0.11580799818038941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,16,power_law_1.2,0.15971200466156005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,balanced,1.3562080065409343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,power_law_1.01,0.11707520484924316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,16,power_law_1.2,0.1675968050956726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,power_law_1.01,0.12383359670639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,16,power_law_1.2,1.3763263702392579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,power_law_1.01,0.13139840364456176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,power_law_1.01,0.14482560157775878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,16,power_law_1.2,1.3675264358520507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,power_law_1.01,0.15137280225753785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,16,power_law_1.2,0.19901440143585206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,16,power_law_1.2,0.22048640251159668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,16,power_law_1.2,0.23402879238128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,power_law_1.01,0.1794111967086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,16,power_law_1.2,0.3021183967590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,16,power_law_1.2,0.30071680545806884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,power_law_1.01,0.19283839464187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,16,power_law_1.2,0.39752318859100344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,16,power_law_1.2,0.48993921279907227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,power_law_1.01,0.24579839706420897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,power_law_1.01,0.3024832010269165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,16,power_law_1.2,0.6631103992462158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,power_law_1.01,0.4038400173187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,16,power_law_1.2,0.7521088123321533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,power_law_1.01,0.4815231800079346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,balanced,2.1458452542622886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,power_law_1.01,0.6863615989685059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,16,power_law_1.2,1.239776039123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,balanced,2.796090761820475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,power_law_1.01,0.9346431732177735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,16,power_law_1.2,1.5141695976257323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,power_law_1.01,1.3676735877990722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,power_law_1.01,2.114713668823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,16,power_law_1.2,1.9788991928100585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,power_law_1.01,2.3022783279418944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,16,power_law_1.2,3.1838464736938477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,power_law_1.01,3.8050750732421874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,16,power_law_1.2,6.041932678222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,balanced,3.324437459309896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,power_law_1.01,7.206956481933593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,16,power_law_1.2,0.07694720029830933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,16,power_law_1.2,0.10088319778442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,16,power_law_1.2,0.05490559935569763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,16,power_law_1.2,0.06178560256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,16,power_law_1.2,0.07449600100517273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,16,power_law_1.2,0.08230400085449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,16,power_law_1.2,0.0958400011062622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,16,power_law_1.2,0.09838079810142517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,16,power_law_1.2,0.10172159671783447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,16,power_law_1.2,0.09831680059432983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,16,power_law_1.2,0.1064255952835083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,balanced,4.282346725463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,16,power_law_1.2,0.1078336000442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,16,power_law_1.2,0.11329920291900634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,16,power_law_1.2,0.12020479440689087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,16,power_law_1.2,0.12997119426727294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,16,power_law_1.2,0.07738239765167236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,16,power_law_1.2,0.13494399785995484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,16,power_law_1.2,0.14032000303268433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,16,power_law_1.2,0.10604159832000733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,16,power_law_1.2,0.16900479793548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,16,power_law_1.2,0.05441920161247253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,16,power_law_1.2,0.064300799369812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,16,power_law_1.2,0.18280960321426393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,16,power_law_1.2,0.06804479956626892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,16,power_law_1.2,0.2262655973434448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,16,power_law_1.2,0.08365439772605895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,16,power_law_1.2,0.27127039432525635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,16,power_law_1.2,0.09505280256271362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,16,power_law_1.2,0.09890559911727906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,16,power_law_1.2,0.35262720584869384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,16,power_law_1.2,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,16,power_law_1.2,0.4094655990600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,16,power_law_1.2,0.10266879796981812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,balanced,0.05638400216897329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,16,power_law_1.2,0.108787202835083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,16,power_law_1.2,0.5853695869445801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,balanced,0.05602666735649109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,balanced,0.06116800010204315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,16,power_law_1.2,0.11521279811859131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,16,power_law_1.2,0.6781631946563721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,balanced,0.07614933451016744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,16,power_law_1.2,0.11906559467315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,16,power_law_1.2,0.9411968231201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,balanced,0.10700266559918721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,16,power_law_1.2,0.12741760015487671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,16,power_law_1.2,1.608083152770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,balanced,0.16194666425387064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,16,power_law_1.2,0.14072959423065184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,balanced,0.16274666786193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,16,power_law_1.2,1.6511999130249024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,16,power_law_1.2,0.14737279415130616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,balanced,0.1609440048535665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,16,power_law_1.2,0.1674880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,16,power_law_1.2,2.787596893310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,balanced,0.16110400358835855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,balanced,0.16266666849454245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,16,power_law_1.2,5.646278381347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,balanced,0.16513066490491232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,16,power_law_1.2,0.1968832015991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,balanced,0.17194666465123495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,balanced,0.16745599110921225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,16,power_law_1.2,0.21846399307250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,balanced,0.17010666926701865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,16,power_law_1.2,0.2863296031951904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,balanced,0.17669866482416788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,16,power_law_1.2,0.33415679931640624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,balanced,0.17784533898035684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,16,power_law_1.2,0.46304001808166506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,16,power_law_1.2,0.6590400218963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,balanced,0.18478933970133463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,16,power_law_1.2,0.8847040176391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,balanced,0.19782400131225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,16,power_law_1.2,1.2085439682006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,balanced,0.2209706703821818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,16,power_law_1.2,1.948691177368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,balanced,0.246778666973114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,16,power_law_1.2,2.2056447982788088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,16,power_law_1.2,2.5594560623168947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,balanced,0.2669546604156494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,16,power_law_1.2,4.319820785522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,balanced,0.31464533011118573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,16,power_law_1.2,9.385491180419923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,balanced,0.3676106532414754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,balanced,0.4660853147506714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,balanced,0.6263039906819662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,balanced,0.047914668917655945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,balanced,0.04860800007979075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.01,0.07775999903678894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,balanced,0.05124266445636749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,balanced,0.06155199805895487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.01,0.1080064058303833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,balanced,0.0807360013326009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.01,0.07280640006065368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,balanced,0.10977600018183391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.01,0.07726719975471497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.01,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,balanced,0.8703359762827555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,balanced,0.11201066772143047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.01,0.09442560076713562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,balanced,0.11229333281517029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.01,0.07682560086250305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,balanced,0.11343466242154439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.01,0.11071360111236572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.01,0.05777279734611511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,balanced,0.11437867085138957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.01,0.13432320356369018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.01,0.06236159801483154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,balanced,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.01,0.13115520477294923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,balanced,0.05206400156021118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,balanced,0.11926399668057759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.01,0.07453439831733703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.01,0.139136004447937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,balanced,0.05392000079154968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,balanced,0.12264000376065572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.01,0.08199679851531982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.01,0.14186880588531495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,balanced,0.06836799780527751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,balanced,0.12332800030708313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.01,0.09690880179405212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,balanced,0.08546666304270427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.01,0.14750720262527467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,balanced,1.0275306701660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,balanced,0.1321440041065216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.01,0.09641600251197815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,balanced,0.11474133531252544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.01,0.15279359817504884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,balanced,0.1344480017820994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,balanced,0.11652800440788269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.01,0.10254720449447632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.01,0.1556864023208618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,balanced,0.11802132924397786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,balanced,0.14293866356213888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.01,0.1027008056640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,balanced,0.11956800023714702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.01,0.17107199430465697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,balanced,0.1585973302523295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.01,0.10623359680175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,balanced,0.12078932921091716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.01,0.17754240036010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,balanced,0.12226133545239766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.01,0.1088703989982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,balanced,0.17789334058761597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,balanced,0.12441600362459819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.01,0.8868096351623536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.01,0.11360640525817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,balanced,0.2089759906133016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,balanced,0.1284213364124298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.01,1.3694208145141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.01,0.12136319875717164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,balanced,0.1309760014216105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.01,0.13160320520401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.01,1.3911104202270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,balanced,0.2342080076535543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,balanced,1.298746665318807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.01,0.13697919845581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,balanced,0.13962666193644205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.01,0.23761279582977296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.01,0.14413440227508545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,balanced,0.14286399881045023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,balanced,0.2927253246307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.01,0.16927360296249389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.01,0.2634239912033081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,balanced,0.15333333611488342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.01,0.1898687958717346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,power_law_1.01,0.06999040246009827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.01,0.3057152032852173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.01,0.22464640140533448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.01,0.4085440158843994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,power_law_1.01,0.08257279992103576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,balanced,0.3566879828770955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.01,0.2687743902206421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,power_law_1.01,0.056979197263717654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.01,0.4501952171325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.01,0.35658879280090333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.01,0.5675712108612061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,power_law_1.01,0.06815360188484192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.01,0.42414078712463377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,balanced,0.17430933316548666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.01,0.570527982711792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,power_law_1.01,0.07402240037918091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.01,0.7600639820098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,balanced,0.4797439972559611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.01,0.7537216186523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,power_law_1.01,0.08638719916343689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.01,1.038649559020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,power_law_1.01,0.10122879743576049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.01,1.077228832244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.01,1.4141823768615722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,power_law_1.01,0.10805759429931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.01,1.4355839729309081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.01,1.5803839683532714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,power_law_1.01,0.10542720556259155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,balanced,0.6341919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.01,1.639788818359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,balanced,0.20371200640996298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.01,2.6639999389648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,power_law_1.01,0.11279360055923462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,balanced,1.8310559590657551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.01,2.6699455261230467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,balanced,0.2515733242034912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,power_law_1.01,0.11804159879684448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.01,4.762540817260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.01,5.958252716064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,power_law_1.01,0.1257151961326599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,balanced,0.29099200169245404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,power_law_1.01,0.1317952036857605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,balanced,0.9132106304168701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,power_law_1.01,0.14258559942245483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,balanced,0.3998719851175944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,power_law_1.01,0.15118720531463622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,power_law_1.01,0.16022399663925171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,balanced,0.4773706595102946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,power_law_1.01,0.1832128047943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,power_law_1.01,0.20851199626922606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,balanced,0.7173333168029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,balanced,1.1152479648590088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,power_law_1.01,0.2450176000595093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,power_law_1.01,0.29373440742492674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,balanced,0.8856800397237142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,8,power_law_1.2,0.07848320007324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,power_law_1.01,0.38689920902252195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,8,power_law_1.2,0.10614399909973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,power_law_1.01,0.5124159812927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,8,power_law_1.2,0.06213120222091675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,8,power_law_1.2,0.07574399709701538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,power_law_1.01,0.6665535926818847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,8,power_law_1.2,0.08580480217933655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,balanced,1.4090186754862468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,power_law_1.01,0.9376319885253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,balanced,1.271999994913737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,8,power_law_1.2,0.10392960309982299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,power_law_1.01,1.2377728462219237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,8,power_law_1.2,0.13504639863967896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,power_law_1.01,1.6850048065185548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,8,power_law_1.2,0.13101439476013182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,8,power_law_1.2,0.13524479866027833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,power_law_1.01,2.2967872619628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,8,power_law_1.2,0.1433087944984436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,balanced,3.5935840606689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,power_law_1.01,2.7208320617675783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,8,power_law_1.2,0.1552448034286499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,8,power_law_1.2,0.14911359548568726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,balanced,1.663248062133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,power_law_1.01,4.761491012573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,8,power_law_1.2,0.15897599458694459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,8,power_law_1.2,0.060127997398376466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,8,power_law_1.2,0.17091200351715088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,power_law_1.01,10.561074829101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,8,power_law_1.2,1.1341823577880858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,8,power_law_1.2,0.07756800055503846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,8,power_law_1.2,1.3672896385192872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,8,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,balanced,2.117578665415446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,8,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,8,power_law_1.2,1.393836784362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,8,power_law_1.2,0.07046399712562561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,8,power_law_1.2,1.4263808250427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,8,power_law_1.2,0.07599999904632568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,8,power_law_1.2,0.2527424097061157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,balanced,2.058330694834391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,8,power_law_1.2,0.09731839895248413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,8,power_law_1.2,0.28085761070251464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,8,power_law_1.2,0.09527040123939515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,8,power_law_1.2,0.31619839668273925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,8,power_law_1.2,0.10252799987792968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,8,power_law_1.2,0.4066688060760498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,8,power_law_1.2,0.10255359411239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,8,power_law_1.2,0.4991168022155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,8,power_law_1.2,0.10547840595245361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,8,power_law_1.2,0.5865407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,8,power_law_1.2,0.11015679836273193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,8,power_law_1.2,0.8564543724060059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,8,power_law_1.2,0.1180351972579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,8,power_law_1.2,1.1387840270996095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,8,power_law_1.2,0.13178880214691163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,8,power_law_1.2,1.6987199783325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,8,power_law_1.2,0.14050559997558593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,8,power_law_1.2,0.14551039934158325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,8,power_law_1.2,2.1104703903198243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,8,power_law_1.2,0.14731520414352417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,8,power_law_1.2,2.5993152618408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,8,power_law_1.2,0.18287999629974366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,balanced,3.2517334620157876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,8,power_law_1.2,0.19245439767837524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,8,power_law_1.2,7.262355041503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,8,power_law_1.2,0.24484479427337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,8,power_law_1.2,0.2782464027404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,8,power_law_1.2,0.34842240810394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,8,power_law_1.2,0.47403521537780763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,8,power_law_1.2,0.6554175853729248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,balanced,4.142719904581706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,8,power_law_1.2,0.8059840202331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,8,power_law_1.2,1.1833855628967285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,8,power_law_1.2,1.569696044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,8,power_law_1.2,1.8731584548950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,8,power_law_1.2,3.0950271606445314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,8,power_law_1.2,6.727033233642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,balanced,0.056015998125076294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,8,power_law_1.2,0.07008640170097351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,balanced,0.05641599992911021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,balanced,0.06309866905212402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,8,power_law_1.2,0.08055040240287781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,balanced,6.474847793579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,8,power_law_1.2,0.05740799903869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,balanced,0.07810666660467784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,8,power_law_1.2,0.07174400091171265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,balanced,0.11074666182200114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,balanced,0.16949333747227988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,8,power_law_1.2,0.0743552029132843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,balanced,0.17082667350769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,8,power_law_1.2,0.08389120101928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,balanced,0.1684373418490092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,8,power_law_1.2,0.09909759759902954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,balanced,0.16943466663360596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,8,power_law_1.2,0.10517760515213012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,balanced,0.17337600390116373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,8,power_law_1.2,0.10969599485397338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,balanced,0.17468800147374472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,8,power_law_1.2,0.11315840482711792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,balanced,0.17955732345581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,8,power_law_1.2,0.11518080234527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,balanced,0.18023999532063803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,8,power_law_1.2,0.12488960027694702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,balanced,0.1866933306058248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,8,power_law_1.2,0.13204480409622193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,balanced,0.1957333286603292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,8,power_law_1.2,0.14161920547485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,balanced,0.197269340356191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,8,power_law_1.2,0.15214719772338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,balanced,0.20722132921218872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,8,power_law_1.2,0.17402880191802977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,balanced,0.2256960074106852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,8,power_law_1.2,0.1960319995880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,balanced,0.252618670463562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,8,power_law_1.2,0.22055680751800538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,balanced,0.2927253246307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,balanced,0.3239786624908447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,8,power_law_1.2,0.2625216007232666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,8,power_law_1.2,0.33152639865875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,balanced,0.4044479926427205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,8,power_law_1.2,0.41658878326416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,8,power_law_1.2,0.5779263973236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,8,power_law_1.2,0.7730048179626465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,balanced,0.49906667073567706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,8,power_law_1.2,0.9797375679016114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,balanced,0.049173335234324135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,8,power_law_1.2,1.313100814819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,8,power_law_1.2,2.358195114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,balanced,0.050581331054369606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,balanced,0.6714133421579996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,8,power_law_1.2,2.469536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,balanced,0.05362666646639506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,balanced,0.06569066643714905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,8,power_law_1.2,3.7899967193603517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,balanced,0.08806399504343669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,balanced,0.1256533364454905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,8,power_law_1.2,5.512057495117188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,balanced,0.8654293219248453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,balanced,0.12773866454760233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,balanced,0.12794133027394614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,8,power_law_1.2,13.124345397949218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,balanced,0.06227200229962667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,balanced,0.06659199794133504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,balanced,0.12800533572832742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,balanced,0.08021866778532664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,balanced,0.1297546625137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,balanced,0.10327999790509541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,balanced,0.13244799772898355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,balanced,0.13876799742380777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,balanced,1.2225386301676433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,balanced,0.14198933045069376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,balanced,0.13555733362833658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,balanced,0.14421332875887552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,balanced,0.13802666465441385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,balanced,0.14648000399271646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,balanced,0.14164800445238748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,balanced,0.14844266573588052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,balanced,0.15150400002797446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,balanced,0.15067733327547708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,balanced,0.1557919979095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,balanced,0.15411733587582907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,balanced,0.16077867150306702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,balanced,0.16435733437538147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,balanced,0.16781334082285562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,balanced,0.18556267023086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,balanced,1.4622079531351726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,balanced,0.18204265832901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.01,0.06202239990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,balanced,0.212501327196757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,balanced,0.1872640053431193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.01,0.08014079928398132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,balanced,0.19734932978947958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,balanced,0.24830933411916098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.01,0.0643392026424408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.01,0.07455999851226806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,balanced,0.2858346700668335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.01,0.09191679954528809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,balanced,0.23736000061035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,balanced,0.37586132685343426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.01,0.11032320261001587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.01,0.1386944055557251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.01,0.052134400606155394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.01,0.13667839765548706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,balanced,1.8534986178080242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,balanced,0.4699680010477702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.01,0.06417919993400574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.01,0.14357759952545165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.01,0.05923839807510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.01,0.145907199382782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,balanced,0.30721600850423175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.01,0.06247680187225342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.01,0.1539520025253296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,balanced,0.6579146782557169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.01,0.07453439831733703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,balanced,0.3910026550292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.01,0.1617535948753357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.01,0.08597760200500489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.01,0.17123199701309205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,balanced,0.44631465276082355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.01,0.10366079807281495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.01,0.18103040456771852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,balanced,0.856282631556193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.01,0.11065599918365479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.01,0.1996608018875122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,balanced,0.6338186661402384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.01,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.01,0.2075455904006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,power_law_1.01,0.0671231985092163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.01,0.11584000587463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.01,1.3971263885498046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,power_law_1.01,0.07803519964218139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,balanced,0.7620320320129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.01,0.11980160474777221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.01,1.4320063591003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.01,0.1255295991897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,power_law_1.01,0.0693120002746582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.01,1.4850879669189454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.01,0.12883199453353883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,power_law_1.01,0.07894399762153625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,balanced,1.2437653541564941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,balanced,2.784661293029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.01,0.14048000574111938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.01,2.2482816696166994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,balanced,1.156773328781128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,power_law_1.01,0.08865919709205627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.01,0.15215359926223754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.01,0.3584000110626221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,power_law_1.01,0.10319360494613647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.01,0.1583680033683777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.01,0.4404032230377197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,power_law_1.01,0.11887999773025512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.01,0.17420799732208253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.01,0.5969664096832276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,power_law_1.01,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.01,0.20154240131378173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,balanced,1.4405226707458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.01,0.7646848201751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,power_law_1.01,0.13167359828948974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.01,0.22759039402008058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,power_law_1.01,0.1338047981262207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.01,0.9750847816467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.01,0.27076480388641355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,balanced,1.51420259475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,power_law_1.01,0.1434816002845764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.01,0.31342079639434817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.01,1.4091903686523437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,4,power_law_1.2,0.06219519972801209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,power_law_1.01,0.1525887966156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.01,0.41170558929443357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.01,1.6800960540771483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,4,power_law_1.2,0.07931519746780395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,power_law_1.01,0.16035840511322022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.01,0.5329216003417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,balanced,2.11734930674235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,4,power_law_1.2,0.06321280002593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.01,2.0357759475708006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,power_law_1.01,0.1805184006690979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.01,0.6967423915863037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,4,power_law_1.2,0.07041280269622803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,power_law_1.01,0.19331200122833253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.01,0.9276991844177246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,4,power_law_1.2,0.08421120047569275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.01,3.4825279235839846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,power_law_1.01,0.20079360008239747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,4,power_law_1.2,0.10394879579544067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.01,1.351859188079834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,power_law_1.01,0.22916479110717775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,4,power_law_1.2,0.13056000471115112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.01,7.194924926757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.01,1.7361919403076171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,4,power_law_1.2,0.13471360206604005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,balanced,1.9257814089457195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,4,power_law_1.2,0.14058239459991456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.01,2.1620607376098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,power_law_1.01,0.29760639667510985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,4,power_law_1.2,0.1463039994239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,balanced,2.7894134521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,4,power_law_1.2,0.1552448034286499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.01,3.670073699951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,4,power_law_1.2,0.16518399715423585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,power_law_1.01,0.34330880641937256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,4,power_law_1.2,0.1780608057975769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.01,6.9049537658691404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,4,power_law_1.2,0.1933184027671814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,power_law_1.01,0.4347839832305908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,4,power_law_1.2,0.2035072088241577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,power_law_1.01,0.5423999786376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,4,power_law_1.2,0.20805759429931642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,4,power_law_1.2,1.4095487594604492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,power_law_1.01,0.7497663974761963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,4,power_law_1.2,1.4439552307128907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,power_law_1.01,0.9569919586181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,4,power_law_1.2,2.2098880767822267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,power_law_1.01,1.398195171356201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,4,power_law_1.2,2.5314815521240233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,balanced,3.4728320439656577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,balanced,5.438394546508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,4,power_law_1.2,0.36583681106567384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,power_law_1.01,1.7843135833740233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,4,power_law_1.2,0.45240960121154783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,power_law_1.01,2.652787208557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,balanced,2.937434514363607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,4,power_law_1.2,0.650432014465332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,power_law_1.01,3.360006332397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,4,power_law_1.2,0.836025619506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,power_law_1.01,4.438438415527344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,4,power_law_1.2,1.0240127563476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,4,power_law_1.2,1.4530943870544433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,power_law_1.01,6.652365112304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,4,power_law_1.2,1.981439971923828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,4,power_law_1.2,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,power_law_1.01,13.44322509765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,4,power_law_1.2,2.357107162475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,4,power_law_1.2,0.06421759724617004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,4,power_law_1.2,0.05386880040168762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,4,power_law_1.2,3.794617462158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,4,power_law_1.2,0.06213120222091675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,balanced,5.497061411539714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,4,power_law_1.2,0.07349119782447815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,4,power_law_1.2,7.792851257324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,4,power_law_1.2,0.08524799942970276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,4,power_law_1.2,0.10279680490493774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,4,power_law_1.2,0.1058303952217102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,4,power_law_1.2,0.11147520542144776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,4,power_law_1.2,0.11534719467163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,4,power_law_1.2,0.12055679559707641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,4,power_law_1.2,0.12774399518966675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,4,power_law_1.2,0.13294719457626342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,4,power_law_1.2,0.14286719560623168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,4,power_law_1.2,0.15438719987869262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,4,power_law_1.2,0.16442240476608277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,4,power_law_1.2,0.18259840011596679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,4,power_law_1.2,0.21062400341033935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,4,power_law_1.2,0.23269119262695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,balanced,5.812431971232097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,4,power_law_1.2,0.2800447940826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,4,power_law_1.2,0.3274944067001343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,4,power_law_1.2,0.4250944137573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,4,power_law_1.2,0.5566336154937744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,4,power_law_1.2,0.7478720188140869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,4,power_law_1.2,0.9673791885375976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,4,power_law_1.2,1.5947903633117675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,4,power_law_1.2,2.032364845275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,4,power_law_1.2,2.419615936279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,4,power_law_1.2,3.9916671752929687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,balanced,10.900848388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,4,power_law_1.2,7.435686492919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,4,power_law_1.2,0.06725119948387145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,4,power_law_1.2,0.0782975971698761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,4,power_law_1.2,0.06670079827308655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,4,power_law_1.2,0.07836160063743591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,balanced,0.05807466804981232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,4,power_law_1.2,0.08896639943122864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,balanced,0.06011199951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,4,power_law_1.2,0.09800320267677307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,balanced,0.08017600079377492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,4,power_law_1.2,0.11715199947357177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,balanced,0.09542399644851685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,4,power_law_1.2,0.1255231976509094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,balanced,0.05216533442338308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,balanced,0.13061333696047464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,4,power_law_1.2,0.13167359828948974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,balanced,0.19569599628448486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,balanced,0.05505066613356272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,4,power_law_1.2,0.13521280288696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,balanced,0.198362668355306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,balanced,0.06649066507816315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,4,power_law_1.2,0.14683519601821898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,balanced,0.19131199518839517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,balanced,0.08140799899895985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,balanced,0.1112000048160553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,balanced,0.19249600172042847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,4,power_law_1.2,0.15971839427947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,balanced,0.16525866587956747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,balanced,0.19504533211390176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,4,power_law_1.2,0.15842560529708863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,balanced,0.1660426656405131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,balanced,0.19951999187469482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,4,power_law_1.2,0.18056319952011107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,balanced,0.1672853430112203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,balanced,0.20327999194463095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,4,power_law_1.2,0.20713601112365723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,balanced,0.17065600554148355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,balanced,0.20661866664886475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,balanced,0.17131733894348145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,4,power_law_1.2,0.21241600513458253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,balanced,0.1731733282407125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,balanced,0.21082667509714761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,4,power_law_1.2,0.24308478832244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,balanced,0.17775466044743857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,balanced,0.21970132986704508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,balanced,0.18302400906880698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,balanced,0.22606400648752847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,balanced,0.18492799997329712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,4,power_law_1.2,0.29271678924560546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,balanced,0.23772799968719482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,balanced,0.19368000825246176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,balanced,0.19977599382400513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,balanced,0.2711306611696879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,balanced,0.21472533543904623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,4,power_law_1.2,0.34700798988342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,balanced,0.3135840098063151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.01,0.05856000185012818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,balanced,0.25013866027196247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,4,power_law_1.2,0.4659071922302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,balanced,0.36982401212056476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,balanced,0.2913600007692973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,4,power_law_1.2,0.5800960063934326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.01,0.06823679804801941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,4,power_law_1.2,0.7994688034057618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.01,0.06538239717483521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,balanced,0.4352746804555257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,balanced,0.3388959964116414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.01,0.08967679738998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,4,power_law_1.2,1.003609561920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,balanced,0.3903839985529582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.01,0.11115520000457764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,balanced,0.5882826646169027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,4,power_law_1.2,1.4978752136230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.01,0.12622079849243165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,4,power_law_1.2,1.8375680923461915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,balanced,0.5513493220011393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.01,0.15358079671859742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,balanced,0.7662453651428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,4,power_law_1.2,2.9439359664916993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.01,0.1570304036140442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.01,0.16510720252990724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,balanced,0.7121493021647135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,4,power_law_1.2,3.4007553100585937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.01,0.17004799842834473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.01,0.17683839797973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,balanced,1.0837706724802654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,4,power_law_1.2,4.706227111816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.01,0.0530239999294281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.01,0.18680959939956665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,balanced,1.020095984141032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.01,0.19831680059432982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,4,power_law_1.2,7.258188629150391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.01,0.06674559712409973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.01,0.20629758834838868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.01,0.05738239884376526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.01,0.22211201190948487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,balanced,1.4051094055175781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.01,0.07364479899406433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,4,power_law_1.2,14.885498046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.01,1.431999969482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,balanced,1.3544692993164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.01,0.09191679954528809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.01,1.4669247627258302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.01,0.10780800580978393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.01,1.5148927688598632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.01,0.128985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.01,1.5269696235656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.01,0.14124799966812135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.01,2.307910346984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,balanced,2.103813330332438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.01,0.14168319702148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,balanced,2.008255958557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,2,power_law_1.2,0.05752320289611816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.01,0.4490496158599854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.01,0.14750080108642577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,2,power_law_1.2,0.06446080207824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.01,0.6122943878173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,2,power_law_1.2,0.06384000182151794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.01,0.15737600326538087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.01,0.7710207939147949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,2,power_law_1.2,0.08480640053749085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.01,1.0861120223999023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.01,0.1621440052986145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,2,power_law_1.2,0.09819520115852357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.01,1.3874624252319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.01,0.1719871997833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,2,power_law_1.2,0.11733759641647339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.01,2.068377685546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.01,0.18778239488601683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,2,power_law_1.2,0.14832639694213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,balanced,2.3632639249165854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.01,2.458700752258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,balanced,2.3858933448791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,2,power_law_1.2,0.1600383996963501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.01,0.20581119060516356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.01,3.1816768646240234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,2,power_law_1.2,0.1588863968849182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.01,0.22445440292358398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,2,power_law_1.2,0.17311999797821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.01,5.03770866394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.01,0.23452799320220946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,2,power_law_1.2,0.17984639406204223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.01,10.947328186035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,2,power_law_1.2,0.18952319622039795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.01,0.28073599338531496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,2,power_law_1.2,0.19916800260543824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.01,0.3051455974578857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,2,power_law_1.2,0.2103935956954956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.01,0.3690880060195923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,2,power_law_1.2,1.4246399879455567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,balanced,3.087168057759603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,balanced,3.072890599568685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.01,0.4482111930847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,2,power_law_1.2,1.4366016387939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,2,power_law_1.2,1.4726207733154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.01,0.5782015800476075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,2,power_law_1.2,1.5233280181884765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.01,0.7375616073608399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,2,power_law_1.2,1.7784000396728517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.01,1.031443214416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,2,power_law_1.2,2.8329727172851564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.01,1.3094719886779784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,2,power_law_1.2,0.4801919937133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.01,1.933420753479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,2,power_law_1.2,0.6442815780639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.01,2.5597440719604494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,2,power_law_1.2,0.8126399993896485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.01,3.050604820251465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,2,power_law_1.2,1.151084804534912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,2,power_law_1.2,1.4246975898742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.01,5.251839828491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,2,power_law_1.2,2.208358383178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,balanced,4.728426615397136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,balanced,4.588549296061198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.01,10.165471649169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,2,power_law_1.2,2.6784576416015624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,2,power_law_1.2,3.412364959716797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,2,power_law_1.2,5.740588760375976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,power_law_1.2,10.707308959960937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,balanced,9.339893341064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,2,balanced,9.049066543579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,2,power_law_1.2,0.05264639854431152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,2,power_law_1.2,0.06552960276603699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,2,power_law_1.2,0.05865600109100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,2,power_law_1.2,0.07441279888153077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,2,power_law_1.2,0.08789119720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,2,power_law_1.2,0.10197759866714477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,2,power_law_1.2,0.1299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,2,power_law_1.2,0.13375999927520751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,2,power_law_1.2,0.13948800563812255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,2,power_law_1.2,0.14665600061416625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,2,power_law_1.2,0.1582335948944092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,2,power_law_1.2,0.15961600542068483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,2,power_law_1.2,0.17468160390853882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,2,power_law_1.2,0.18703360557556153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,2,power_law_1.2,0.2133120059967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,2,power_law_1.2,0.22467200756072997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,2,power_law_1.2,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,2,power_law_1.2,0.285318398475647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,2,power_law_1.2,0.31025280952453616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,balanced,0.02465066562096278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,2,power_law_1.2,0.37626240253448484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,balanced,0.027749332288901012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,2,power_law_1.2,0.45920000076293943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,balanced,0.02756800005833308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,balanced,0.029135999580224354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,2,power_law_1.2,0.5823103904724121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,balanced,0.030048000315825146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,2,power_law_1.2,0.7625343799591064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,balanced,0.027471999327341717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,2,power_law_1.2,1.093900775909424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,balanced,0.030282666285832722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,2,power_law_1.2,1.4563136100769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,balanced,0.03067733347415924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,balanced,0.029829333225886028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,2,power_law_1.2,2.0264320373535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,balanced,0.031146667897701263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,2,power_law_1.2,2.6316736221313475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,balanced,0.028351999819278717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,balanced,0.0308746670683225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,2,power_law_1.2,3.1341567993164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,balanced,0.0317546675602595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,balanced,0.03294933338960012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,balanced,0.029861333469549816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,2,power_law_1.2,5.3586688995361325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,balanced,0.03660800059636434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,balanced,0.03129599988460541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,balanced,0.038218667109807335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,balanced,0.033045334120591484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,2,power_law_1.2,11.309747314453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,balanced,0.0386559988061587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,balanced,0.03429333368937174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,balanced,0.03460799902677536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,balanced,0.04171200096607208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,balanced,0.034448000291983284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,balanced,0.03455466777086258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,balanced,0.04120533416668574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,balanced,0.03487999985615412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,balanced,0.05064000189304352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,balanced,0.035487999518712364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,balanced,0.03571200122435888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,balanced,0.03633599976698557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,balanced,0.047024001677831016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,balanced,0.037920000652472176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,balanced,0.03978666663169861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,balanced,0.05682666599750519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,balanced,0.039477333426475525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,balanced,0.040405333042144775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,balanced,0.057274664441744484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,balanced,0.042266666889190674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,balanced,0.043605332573254905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,balanced,0.047370667258898415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,balanced,0.0698880006869634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,balanced,0.024245334168275196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,balanced,0.05068266888459524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,power_law_1.01,0.030112001299858093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,balanced,0.023413332800070446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,balanced,0.06950399776299794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,balanced,0.07455466687679291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,power_law_1.01,0.029369598627090453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,balanced,0.023621333142121632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,power_law_1.01,0.030156800150871278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,balanced,0.025349333882331848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,balanced,0.07468800246715546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,balanced,0.02566933383544286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,power_law_1.01,0.030649599432945252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,balanced,0.027119999130566914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,power_law_1.01,0.02898559868335724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,balanced,0.027589333554108936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,balanced,0.027514666318893433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,power_law_1.01,0.02885119915008545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,balanced,0.09327999750773112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,balanced,0.027600000301996868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,balanced,0.10338133573532104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,power_law_1.01,0.030623999238014222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,balanced,0.0281333327293396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,power_law_1.01,0.032390400767326355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,balanced,0.02855466554562251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,balanced,0.028704000016053517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,power_law_1.01,0.0350271999835968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,balanced,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,balanced,0.11004799604415894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,balanced,0.029685333371162415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,power_law_1.01,0.03489919900894165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,power_law_1.01,0.03438720107078552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,power_law_1.01,0.03480319976806641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,balanced,0.0322773332397143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,power_law_1.01,0.039705601334571836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,power_law_1.01,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,balanced,0.03190399954716364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,balanced,0.11123200257619222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,power_law_1.01,0.045516800880432126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,power_law_1.01,0.030777600407600404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,power_law_1.01,0.049132800102233885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,power_law_1.01,0.032620799541473386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,power_law_1.01,0.02374400049448013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,power_law_1.01,0.05379840135574341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,balanced,0.1476586659749349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,power_law_1.01,0.03308799862861633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,power_law_1.01,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,power_law_1.01,0.023001599311828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,power_law_1.01,0.03367680013179779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,power_law_1.01,0.0682752013206482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,balanced,0.03257599969704946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,power_law_1.01,0.023398399353027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,power_law_1.01,0.0335999995470047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,power_law_1.01,0.08258559703826904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,power_law_1.01,0.02510719895362854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,power_law_1.01,0.07854080200195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,balanced,0.03502399971087774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,power_law_1.01,0.033907198905944826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,power_law_1.01,0.11964800357818603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,power_law_1.01,0.025593599677085875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,balanced,0.03402133285999298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,power_law_1.01,0.10638079643249512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,power_law_1.01,0.02687999904155731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,power_law_1.01,0.03523840010166168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,power_law_1.01,0.14761600494384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,power_law_1.01,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,power_law_1.01,0.17923200130462646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,power_law_1.01,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,balanced,0.12727466225624084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,power_law_1.01,0.03648639917373657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,balanced,0.1754186749458313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,power_law_1.01,0.26305279731750486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,power_law_1.01,0.02754560112953186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,power_law_1.01,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,power_law_1.01,0.3019455909729004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,power_law_1.01,0.027673599123954774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,power_law_1.01,0.3339839935302734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,power_law_1.01,0.038361600041389464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,balanced,0.04064533362785975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,power_law_1.01,0.02842240035533905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,power_law_1.01,0.04129279851913452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,power_law_1.01,0.6848832130432129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,power_law_1.01,0.029158401489257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,power_law_1.01,0.029747200012207032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,balanced,0.04137066751718521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,power_law_1.01,1.5978879928588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,power_law_1.01,0.031225600838661195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,power_law_1.01,0.03473280072212219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,power_law_1.01,0.044121599197387694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,power_law_1.01,0.03711999952793121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,power_law_1.01,0.05538560152053833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,power_law_1.01,0.057843202352523805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,power_law_1.01,0.04343680143356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,power_law_1.01,0.06734079718589783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,balanced,0.20966400702794394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,balanced,0.04956800242265066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,power_law_1.01,0.08263040184974671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,power_law_1.01,0.054739201068878175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,power_law_1.01,0.06391680240631104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,power_law_1.01,0.10011520385742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,power_law_1.01,0.11324160099029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,balanced,0.05754666527112325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,power_law_1.01,0.17151360511779784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,balanced,0.18729066848754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,power_law_1.01,0.0689791977405548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,power_law_1.01,0.1840831995010376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,power_law_1.01,0.08723199963569642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,power_law_1.01,0.2624639987945557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,power_law_1.01,0.36666240692138674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,power_law_1.01,0.09765759706497193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,power_law_1.01,0.4806975841522217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,power_law_1.01,0.14547840356826783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,power_law_1.01,0.6596543788909912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,power_law_1.01,1.3919360160827636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,balanced,0.07419200241565704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,power_law_1.01,0.1791424036026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,64,power_law_1.2,0.026092800498008727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,balanced,0.3104853431383769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,64,power_law_1.2,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,64,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,power_law_1.01,0.2212735891342163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,balanced,0.08775466680526733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,64,power_law_1.2,0.02956160008907318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,64,power_law_1.2,0.035097599029541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,power_law_1.01,0.42386560440063475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,64,power_law_1.2,0.03027839958667755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,power_law_1.01,0.5310976028442382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,64,power_law_1.2,0.030291199684143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,64,power_law_1.2,0.02873600125312805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,64,power_law_1.2,0.03091199994087219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,64,power_law_1.2,0.02892799973487854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,64,power_law_1.2,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,64,power_law_1.2,0.030796799063682555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,balanced,0.11868799726168315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,64,power_law_1.2,0.03311359882354736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,64,power_law_1.2,0.03239679932594299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,64,power_law_1.2,0.03258239924907684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,64,power_law_1.2,0.03381119966506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,64,power_law_1.2,0.03404799997806549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,power_law_1.01,0.609600019454956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,64,power_law_1.2,0.03367680013179779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,64,power_law_1.2,0.03591679930686951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,power_law_1.01,1.2912960052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,64,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,64,power_law_1.2,0.035648000240325925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,64,power_law_1.2,0.03565439879894257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,64,power_law_1.2,0.04286719858646393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,power_law_1.01,2.161465644836426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,64,power_law_1.2,0.0525439977645874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,64,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,balanced,0.146314670642217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,64,power_law_1.2,0.05249279737472534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,64,power_law_1.2,0.03654400110244751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,balanced,0.32366400957107544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,64,power_law_1.2,0.05767679810523987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,64,power_law_1.2,0.03681919872760773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,64,power_law_1.2,0.07137920260429383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,64,power_law_1.2,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,64,power_law_1.2,0.08257279992103576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,64,power_law_1.2,0.03858560025691986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,64,power_law_1.2,0.10714880228042603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,64,power_law_1.2,0.04208639860153198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,64,power_law_1.2,0.09139840006828308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,64,power_law_1.2,0.13472000360488892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,64,power_law_1.2,0.04301440119743347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,64,power_law_1.2,0.13891199827194214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,64,power_law_1.2,0.04997760057449341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,64,power_law_1.2,0.17486720085144042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,64,power_law_1.2,0.05610880255699158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,balanced,0.5772746801376343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,balanced,0.17618666092554727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,64,power_law_1.2,0.28348801136016843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,64,power_law_1.2,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,64,power_law_1.2,0.39466879367828367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,64,power_law_1.2,0.0905344009399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,64,power_law_1.2,0.5153151988983155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,64,power_law_1.2,0.09111679792404175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,64,power_law_1.2,0.12896000146865844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,64,power_law_1.2,0.6812479972839356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,64,power_law_1.2,0.13326079845428468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,64,power_law_1.2,1.0638336181640624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,64,power_law_1.2,0.22001280784606933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,64,power_law_1.2,2.692095947265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,64,power_law_1.2,0.2470911979675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,64,power_law_1.2,0.370035195350647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,64,power_law_1.2,0.5071487903594971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,64,power_law_1.2,0.6806399822235107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,balanced,0.2646239995956421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,64,power_law_1.2,1.2531135559082032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,64,power_law_1.2,2.9196544647216798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,64,power_law_1.2,0.023654399812221526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,64,power_law_1.2,0.022918400168418885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,64,power_law_1.2,0.02325119972229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,64,power_law_1.2,0.02503040134906769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,64,power_law_1.2,0.02558720111846924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,64,power_law_1.2,0.026873600482940675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,64,power_law_1.2,0.0271807998418808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,64,power_law_1.2,0.027187201380729675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,balanced,0.5373706817626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,64,power_law_1.2,0.02733440101146698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,64,power_law_1.2,0.027718400955200194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,64,power_law_1.2,0.0290367990732193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,64,power_law_1.2,0.029631999135017396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,64,power_law_1.2,0.029996800422668456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,balanced,0.025568000972270966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,64,power_law_1.2,0.03165439963340759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,balanced,0.022650666534900665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,64,power_law_1.2,0.038841599225997926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,balanced,0.02274133265018463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,64,power_law_1.2,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,balanced,0.024010665714740753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,balanced,0.026714667677879333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,balanced,0.02754133443037669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,64,power_law_1.2,0.04678399860858917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,balanced,0.027471999327341717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,64,power_law_1.2,0.06197119951248169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,balanced,0.0276853342851003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,64,power_law_1.2,0.06773759722709656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,balanced,0.02826666583617528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,balanced,0.028223998844623566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,64,power_law_1.2,0.0859008014202118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,balanced,0.02865600089232127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,64,power_law_1.2,0.114028799533844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,balanced,0.028944000601768494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,balanced,0.0296426663796107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,balanced,0.03551466763019562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,64,power_law_1.2,0.13834240436553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,balanced,0.03718933214743932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,64,power_law_1.2,0.18110079765319825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,balanced,0.037317333122094475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,balanced,0.038618666430314384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,balanced,0.04049599915742874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,64,power_law_1.2,0.3453376054763794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,balanced,0.041696002086003624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,64,power_law_1.2,0.42315521240234377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,balanced,0.04984533290068308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,64,power_law_1.2,0.5683839797973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,balanced,0.04872000217437744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,64,power_law_1.2,0.8309503555297851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,balanced,0.030784000953038532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,balanced,0.059749335050582886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,balanced,0.029232000311215717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,64,power_law_1.2,1.2193984031677245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,balanced,0.029264000554879505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,64,power_law_1.2,1.7091583251953124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,balanced,0.03268799930810928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,balanced,0.06043733159701029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,balanced,0.032629333436489105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,balanced,0.03399466723203659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,64,power_law_1.2,4.04461441040039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,balanced,0.03435199956099192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,balanced,0.03403733422358831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,power_law_1.01,0.028089600801467895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,balanced,0.07486400008201599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,balanced,0.03425599883000056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,balanced,0.02382933348417282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,power_law_1.01,0.023955200612545014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,balanced,0.03461866577466329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,balanced,0.023530667026837666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,power_law_1.01,0.02237440049648285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,balanced,0.035274667044480644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,balanced,0.023845332364241283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,power_law_1.01,0.024108800292015075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,balanced,0.03526400029659271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,balanced,0.025834667185942333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,balanced,0.08406399687131245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,power_law_1.01,0.02475520074367523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,balanced,0.035989334185918175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,balanced,0.02640533447265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,power_law_1.01,0.026604801416397095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,power_law_1.01,0.036748799681663516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,balanced,0.03743999948104223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,balanced,0.027445333699385326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,power_law_1.01,0.027596798539161683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,balanced,0.039701332648595176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,balanced,0.027797333896160126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,power_law_1.01,0.03136000037193298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,power_law_1.01,0.027744001150131224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,balanced,0.02739733209212621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,balanced,0.03937600056330363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,power_law_1.01,0.03054080009460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,power_law_1.01,0.029862400889396668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,balanced,0.02759466568628947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,balanced,0.040549332896868386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,power_law_1.01,0.03278079926967621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,power_law_1.01,0.03115519881248474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,balanced,0.11283199985822041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,balanced,0.028165332973003387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,power_law_1.01,0.0319680005311966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,balanced,0.04261866708596548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,power_law_1.01,0.03251200020313263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,balanced,0.028336000939210255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,power_law_1.01,0.033580800890922545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,balanced,0.04289066791534424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,power_law_1.01,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,power_law_1.01,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,balanced,0.05137600004673004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,power_law_1.01,0.03759360015392303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,balanced,0.030320001145203907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,power_law_1.01,0.03378559947013855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,power_law_1.01,0.04078719913959503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,power_law_1.01,0.03470079898834229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,balanced,0.053685332338015236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,balanced,0.02977599948644638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,power_law_1.01,0.04355199933052063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,power_law_1.01,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,balanced,0.12756799658139548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,power_law_1.01,0.024614399671554564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,power_law_1.01,0.046086400747299194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,balanced,0.033333333830038704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,power_law_1.01,0.035955199599266054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,power_law_1.01,0.023468799889087677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,power_law_1.01,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,power_law_1.01,0.036723199486732486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,balanced,0.03296533226966858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,power_law_1.01,0.02316800057888031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,power_law_1.01,0.061459201574325564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,power_law_1.01,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,power_law_1.01,0.025382399559020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,balanced,0.07957333326339722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,power_law_1.01,0.07203199863433837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,power_law_1.01,0.039136001467704774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,power_law_1.01,0.026316800713539125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,power_law_1.01,0.0735871970653534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,power_law_1.01,0.04237439930438995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,power_law_1.01,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,power_law_1.01,0.08672000169754028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,power_law_1.01,0.042931199073791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,power_law_1.01,0.02736639976501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,power_law_1.01,0.09870079755783082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,balanced,0.03410666684309641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,balanced,0.09976533055305481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,power_law_1.01,0.044838398694992065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,power_law_1.01,0.027775999903678895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,power_law_1.01,0.1324288010597229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,balanced,0.14710399508476257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,balanced,0.036720000207424164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,power_law_1.01,0.028326401114463808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,power_law_1.01,0.050220799446105954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,power_law_1.01,0.1566912055015564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,power_law_1.01,0.02948479950428009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,power_law_1.01,0.05486720204353333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,balanced,0.03626666714747747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,power_law_1.01,0.2534463882446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,power_law_1.01,0.029760000109672547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,power_law_1.01,0.06650879979133606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,balanced,0.11732266346613567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,power_law_1.01,0.31325440406799315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,power_law_1.01,0.030956798791885377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,power_law_1.01,0.0760640025138855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,power_law_1.01,0.03223679959774017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,power_law_1.01,0.09410560131072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,power_law_1.01,0.3946239948272705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,power_law_1.01,0.034668800234794614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,power_law_1.01,0.1177024006843567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,power_law_1.01,0.599564790725708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,power_law_1.01,0.03616639971733093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,balanced,0.04364799956480662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,power_law_1.01,0.15296640396118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,power_law_1.01,0.9801088333129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,power_law_1.01,0.03940480053424835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,power_law_1.01,0.19875199794769288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,balanced,0.16049599647521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,balanced,0.04593066871166229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,power_law_1.01,0.2816384077072144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,power_law_1.01,0.33978240489959716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,power_law_1.01,0.04266240000724793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,power_law_1.01,0.4440320014953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,power_law_1.01,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,power_law_1.01,0.6674431800842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,power_law_1.01,0.060761600732803345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,balanced,0.2232960065205892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,balanced,0.05792533357938131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,power_law_1.01,1.453343963623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,balanced,0.1957226594289144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,power_law_1.01,0.07153279781341552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,balanced,0.06798933446407318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,power_law_1.01,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,32,power_law_1.2,0.02791680097579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,power_law_1.01,0.10700160264968872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,32,power_law_1.2,0.02268799990415573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,power_law_1.01,0.12290560007095337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,32,power_law_1.2,0.024243199825286867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,32,power_law_1.2,0.025043201446533204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,balanced,0.2344906727472941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,32,power_law_1.2,0.02736000120639801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,balanced,0.08727467060089111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,power_law_1.01,0.17893760204315184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,32,power_law_1.2,0.027667200565338133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,32,power_law_1.2,0.029734399914741517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,32,power_law_1.2,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,32,power_law_1.2,0.03194240033626557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,power_law_1.01,0.23510398864746093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,32,power_law_1.2,0.0338239997625351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,power_law_1.01,0.38702080249786375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,32,power_law_1.2,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,balanced,0.10687999924023946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,32,power_law_1.2,0.03527680039405823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,power_law_1.01,0.571999979019165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,32,power_law_1.2,0.03916159868240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,power_law_1.01,0.7066751956939697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,32,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,32,power_law_1.2,0.04490880072116852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,power_law_1.01,0.9320511817932129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,32,power_law_1.2,0.05092480182647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,32,power_law_1.2,0.052883201837539674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,power_law_1.01,2.0124095916748046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,balanced,0.14786666631698608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,32,power_law_1.2,0.06503040194511414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,balanced,0.3526346683502197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,32,power_law_1.2,0.08463360071182251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,balanced,0.3962080081303914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,32,power_law_1.2,0.08829439878463745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,32,power_law_1.2,0.11020799875259399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,32,power_law_1.2,0.11615359783172607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,32,power_law_1.2,0.17148799896240235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,32,power_law_1.2,0.19325439929962157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,balanced,0.1847040057182312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,32,power_law_1.2,0.32860798835754396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,32,power_law_1.2,0.37029759883880614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,32,power_law_1.2,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,32,power_law_1.2,0.5853695869445801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,32,power_law_1.2,0.030508801341056824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,32,power_law_1.2,1.0964991569519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,32,power_law_1.2,0.029337599873542786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,32,power_law_1.2,0.03313280045986176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,32,power_law_1.2,2.62992000579834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,32,power_law_1.2,0.03224320113658905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,32,power_law_1.2,0.03370240032672882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,32,power_law_1.2,0.03333759903907776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,32,power_law_1.2,0.03426559865474701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,balanced,0.22806400060653687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,32,power_law_1.2,0.03442560136318207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,32,power_law_1.2,0.03447679877281189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,32,power_law_1.2,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,32,power_law_1.2,0.03709439933300018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,32,power_law_1.2,0.03749119937419891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,32,power_law_1.2,0.038790398836135866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,32,power_law_1.2,0.04294399917125702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,32,power_law_1.2,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,32,power_law_1.2,0.04622080028057098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,32,power_law_1.2,0.052857601642608644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,32,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,balanced,0.6657013495763143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,32,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,32,power_law_1.2,0.08094720244407654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,32,power_law_1.2,0.10566400289535523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,32,power_law_1.2,0.13638399839401244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,32,power_law_1.2,0.18298239707946778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,32,power_law_1.2,0.2528512001037598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,balanced,0.36870400110880536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,32,power_law_1.2,0.3046720027923584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,32,power_law_1.2,0.4484864234924316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,32,power_law_1.2,0.5945280075073243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,32,power_law_1.2,1.0604736328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,32,power_law_1.2,2.108998489379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,32,power_law_1.2,0.024716800451278685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,32,power_law_1.2,0.023507200181484222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,32,power_law_1.2,0.023507200181484222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,balanced,0.022101332743962605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,32,power_law_1.2,0.02534399926662445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,balanced,0.022101332743962605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,balanced,0.7102986971537272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,32,power_law_1.2,0.026265600323677064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,balanced,0.022431999444961548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,32,power_law_1.2,0.027449598908424376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,balanced,0.024133334557215374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,32,power_law_1.2,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,balanced,0.026816000541051228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,32,power_law_1.2,0.028230398893356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,balanced,0.028058665494124096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,32,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,balanced,0.027893332143624622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,32,power_law_1.2,0.02890239953994751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,balanced,0.028229333460330963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,32,power_law_1.2,0.029529601335525513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,32,power_law_1.2,0.03185920119285583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,balanced,0.02905600021282832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,32,power_law_1.2,0.031615999341011045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,balanced,0.02887466549873352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,32,power_law_1.2,0.03407999873161316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,balanced,0.02938133229811986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,32,power_law_1.2,0.03948160111904144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,balanced,0.029605334003766377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,balanced,0.031301334500312805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,32,power_law_1.2,0.041465601325035094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,balanced,0.03562133262554804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,balanced,0.03781333317359289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,32,power_law_1.2,0.04479359984397888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,balanced,0.04109866668780645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,32,power_law_1.2,0.05601279735565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,32,power_law_1.2,0.06862720251083373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,balanced,0.040949332217375435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,balanced,0.043663998444875084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,32,power_law_1.2,0.0749504029750824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,balanced,0.04844266672929128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,32,power_law_1.2,0.09468799829483032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,balanced,0.030250666042168934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,32,power_law_1.2,0.12058240175247192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,balanced,0.05260799825191498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,balanced,0.030261332790056866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,32,power_law_1.2,0.16206719875335693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,balanced,0.029994666576385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,balanced,0.06516266862551372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,balanced,0.033200000723203026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,balanced,0.033370666205883026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,32,power_law_1.2,0.2701184034347534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,balanced,0.03505599995454153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,balanced,0.03551999976237615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,balanced,0.0672106643517812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,balanced,0.03537066777547201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,32,power_law_1.2,0.31676158905029295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,balanced,0.03552533437808355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,32,power_law_1.2,0.5260416030883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,balanced,0.03612266729275385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,balanced,0.023946667710940044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,balanced,0.0359946663180987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,balanced,0.08699199557304382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,power_law_1.01,0.026393601298332216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,32,power_law_1.2,0.7308928012847901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,balanced,0.036288000643253326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,balanced,0.023818666736284893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,32,power_law_1.2,0.7803135871887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,power_law_1.01,0.023270399868488313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,balanced,0.03714666763941447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,balanced,0.024362665911515553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,balanced,0.03792533278465271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,power_law_1.01,0.022457599639892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,32,power_law_1.2,1.6846656799316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,balanced,0.040549332896868386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,balanced,0.026799999177455902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,power_law_1.01,0.0234047994017601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,balanced,0.03994666785001755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,balanced,0.09642133116722107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,balanced,0.027130665878454845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,32,power_law_1.2,3.6859840393066405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,power_law_1.01,0.02481919974088669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,balanced,0.0417546679576238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,balanced,0.028650666276613872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,power_law_1.01,0.026892799139022826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,balanced,0.04517866671085358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,balanced,0.02905600021282832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,power_law_1.01,0.026995199918746948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,balanced,0.04584000011285146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,balanced,0.02849599967400233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,balanced,0.028736000259717304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,power_law_1.01,0.027481600642204285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,balanced,0.05390933156013489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,balanced,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,balanced,0.1377226710319519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,power_law_1.01,0.03172479867935181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,balanced,0.02959999938805898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,balanced,0.06039466460545858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,power_law_1.01,0.03177599906921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,balanced,0.030373332401116688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,balanced,0.030960001051425934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,balanced,0.07765866816043854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,power_law_1.01,0.03308799862861633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,power_law_1.01,0.036800000071525577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,balanced,0.031386665999889374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,power_law_1.01,0.03329919874668121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,power_law_1.01,0.030668801069259642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,balanced,0.08798399567604065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,power_law_1.01,0.03457919955253601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,balanced,0.03615466753641764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,power_law_1.01,0.030131199955940248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,power_law_1.01,0.040006399154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,balanced,0.16523200273513794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,balanced,0.0355679988861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,power_law_1.01,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,power_law_1.01,0.04344319999217987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,power_law_1.01,0.032620799541473386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,balanced,0.11475200454394023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,power_law_1.01,0.04529280066490173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,power_law_1.01,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,power_law_1.01,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,power_law_1.01,0.05589119791984558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,balanced,0.03665599972009659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,power_law_1.01,0.05622400045394897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,balanced,0.13529599706331888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,power_law_1.01,0.03614720106124878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,balanced,0.03992533435424169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,power_law_1.01,0.06747519969940186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,power_law_1.01,0.03683840036392212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,power_law_1.01,0.026630398631095887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,power_law_1.01,0.07214720249176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,balanced,0.04085866610209147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,balanced,0.19681066274642944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,power_law_1.01,0.037145599722862244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,power_law_1.01,0.09402880072593689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,power_law_1.01,0.02433920055627823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,power_law_1.01,0.038406398892402646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,power_law_1.01,0.10324480533599853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,power_law_1.01,0.02439039945602417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,power_law_1.01,0.026528000831604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,power_law_1.01,0.038924801349639895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,power_law_1.01,0.14027520418167114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,balanced,0.1925440033276876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,power_law_1.01,0.026771199703216553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,power_law_1.01,0.040294399857521056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,power_law_1.01,0.14867839813232422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,power_law_1.01,0.028537601232528687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,balanced,0.05691733459631602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,power_law_1.01,0.04377599954605103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,power_law_1.01,0.2554431915283203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,power_law_1.01,0.028697600960731505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,power_law_1.01,0.04508160054683685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,power_law_1.01,0.32369279861450195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,power_law_1.01,0.029395198822021483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,power_law_1.01,0.030393600463867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,power_law_1.01,0.4047872066497803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,power_law_1.01,0.05270400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,power_law_1.01,0.03160960078239441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,balanced,0.07410133381684621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,power_law_1.01,0.5340544223785401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,power_law_1.01,0.055801600217819214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,balanced,0.23836799462636313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,power_law_1.01,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,power_law_1.01,0.07276800274848938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,power_law_1.01,1.233779239654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,power_law_1.01,0.03370879888534546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,balanced,0.08668800195058186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,power_law_1.01,0.08593279719352723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,power_law_1.01,0.03666560053825378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,balanced,0.30079466104507446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,power_law_1.01,0.10625920295715333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,power_law_1.01,0.12191359996795655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,power_law_1.01,0.03976959884166718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,power_law_1.01,0.16874879598617554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,power_law_1.01,0.041043201088905336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,power_law_1.01,0.19998079538345337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,16,power_law_1.2,0.02655999958515167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,balanced,0.11593600114186604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,power_law_1.01,0.2873536109924316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,16,power_law_1.2,0.02210559993982315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,power_law_1.01,0.04520959854125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,balanced,0.2890773415565491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,power_law_1.01,0.3610879898071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,16,power_law_1.2,0.022361600399017335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,power_law_1.01,0.05433599948883057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,16,power_law_1.2,0.02414720058441162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,power_law_1.01,0.44688639640808103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,power_law_1.01,0.06516479849815368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,16,power_law_1.2,0.024383999407291412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,power_law_1.01,0.7671040058135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,16,power_law_1.2,0.02730880081653595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,power_law_1.01,0.0729856014251709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,16,power_law_1.2,0.027871999144554137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,power_law_1.01,1.5118847846984864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,16,power_law_1.2,0.029363200068473816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,power_law_1.01,0.08725119829177856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,16,power_law_1.2,0.031916800141334536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,balanced,0.1435413360595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,16,power_law_1.2,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,power_law_1.01,0.11573760509490967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,16,power_law_1.2,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,16,power_law_1.2,0.0339711993932724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,power_law_1.01,0.14625279903411864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,16,power_law_1.2,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,16,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,power_law_1.01,0.22715520858764648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,16,power_law_1.2,0.044019201397895814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,balanced,0.2206666668256124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,16,power_law_1.2,0.04737919867038727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,16,power_law_1.2,0.04865280091762543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,power_law_1.01,0.26044158935546874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,16,power_law_1.2,0.059545600414276124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,balanced,0.4542773167292277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,power_law_1.01,0.44068479537963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,16,power_law_1.2,0.06037120223045349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,power_law_1.01,0.6521024227142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,16,power_law_1.2,0.07061120271682739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,16,power_law_1.2,0.08428800106048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,power_law_1.01,0.788153600692749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,16,power_law_1.2,0.10295679569244384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,power_law_1.01,1.1471936225891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,16,power_law_1.2,0.11585279703140258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,16,power_law_1.2,0.16270079612731933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,power_law_1.01,2.848601531982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,balanced,0.28676267464955646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,16,power_law_1.2,0.18853119611740113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,balanced,0.5634826819101969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,16,power_law_1.2,0.3021440029144287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,16,power_law_1.2,0.4884352207183838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,16,power_law_1.2,0.6493760108947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,16,power_law_1.2,0.8094911575317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,16,power_law_1.2,2.1659584045410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,balanced,0.3524373372395833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,16,power_law_1.2,0.03681280016899109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,16,power_law_1.2,0.030374398827552794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,balanced,0.858400026957194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,16,power_law_1.2,0.030239999294281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,16,power_law_1.2,0.03218559920787811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,balanced,0.5407093365987142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,16,power_law_1.2,0.032601600885391234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,16,power_law_1.2,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,16,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,16,power_law_1.2,0.035519999265670774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,16,power_law_1.2,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,16,power_law_1.2,0.036556801199913024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,16,power_law_1.2,0.03840000033378601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,16,power_law_1.2,0.0389055997133255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,16,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,16,power_law_1.2,0.040575999021530154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,16,power_law_1.2,0.04424319863319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,16,power_law_1.2,0.045900800824165346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,16,power_law_1.2,0.04785279929637909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,16,power_law_1.2,0.05483520030975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,16,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,16,power_law_1.2,0.07411839962005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,16,power_law_1.2,0.0862272024154663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,16,power_law_1.2,0.12417919635772705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,16,power_law_1.2,0.13244160413742065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,16,power_law_1.2,0.20220160484313965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,16,power_law_1.2,0.2311487913131714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,balanced,1.0595253308614094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,16,power_law_1.2,0.4103231906890869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,16,power_law_1.2,0.6665728092193604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,16,power_law_1.2,0.026719999313354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,16,power_law_1.2,0.6782271862030029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,16,power_law_1.2,0.024486400187015533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,16,power_law_1.2,0.02462079972028732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,16,power_law_1.2,1.1096256256103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,16,power_law_1.2,0.0268095999956131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,16,power_law_1.2,0.02707839906215668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,16,power_law_1.2,2.329952049255371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,16,power_law_1.2,0.028755199909210206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,16,power_law_1.2,0.028748801350593566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,16,power_law_1.2,0.031091201305389404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,16,power_law_1.2,0.030963200330734252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,16,power_law_1.2,0.03147520124912262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,16,power_law_1.2,0.032332798838615416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,16,power_law_1.2,0.03331199884414673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,balanced,0.04553600152333578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,16,power_law_1.2,0.03386879861354828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,balanced,0.04326933125654856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,16,power_law_1.2,0.03803519904613495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,balanced,0.04320533573627472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,balanced,0.045114666223526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,16,power_law_1.2,0.04180479943752289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,balanced,0.05797333518664042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,16,power_law_1.2,0.04506880044937134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,balanced,0.05878399809201559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,balanced,0.058970664938290916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,balanced,0.058789332707722984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,16,power_law_1.2,0.048403200507164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,balanced,0.059194669127464294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,16,power_law_1.2,0.056985598802566526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,balanced,0.059077332417170204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,16,power_law_1.2,0.06885759830474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,balanced,0.06035733222961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,balanced,0.06113066772619883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,16,power_law_1.2,0.0773248016834259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,balanced,0.061162665486335754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,16,power_law_1.2,0.10239360332489014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,balanced,0.0613919993241628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,balanced,0.06436799963315327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,16,power_law_1.2,0.13281279802322388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,balanced,0.03561066587766012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,balanced,0.06482133269309998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,16,power_law_1.2,0.16395519971847533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,balanced,0.06620266536871593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,balanced,0.036517334481080375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,balanced,0.06929600238800049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,16,power_law_1.2,0.3220799922943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.053337597846984865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,balanced,0.036687999963760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.04878079891204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,balanced,0.06940266489982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,balanced,0.03873066604137421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,16,power_law_1.2,0.4207295894622803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.04865280091762543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,balanced,0.08141866823037465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,16,power_law_1.2,0.6119232177734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,balanced,0.04330666859944662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.05562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,balanced,0.04268800218900045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,16,power_law_1.2,0.8622591972351075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.05419520139694214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,balanced,0.07674666742483775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,balanced,0.0429066667954127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,16,power_law_1.2,1.3271295547485351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.058316802978515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,balanced,0.028949332733949024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.05768960118293762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,balanced,0.09389866391817729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,16,power_law_1.2,1.7351743698120117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,balanced,0.043231998880704246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,balanced,0.02889599899450938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,balanced,0.028746667007605236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,balanced,0.04566933214664459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.0585919976234436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,16,power_law_1.2,4.326700973510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,balanced,0.0308693324526151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,balanced,0.09711466232935588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,balanced,0.04633066554864248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,balanced,0.035573333501815796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.06074240207672119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,balanced,0.0367999995748202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.06094080209732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,balanced,0.04674666623274485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.037913599610328676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,balanced,0.036687999963760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.06877440214157104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,balanced,0.0372533326347669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,balanced,0.04816000163555145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,balanced,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,balanced,0.13184533516565958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,balanced,0.04934399823347727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.037350401282310486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,balanced,0.03739733248949051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,balanced,0.039135999977588654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.041196799278259276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,balanced,0.03968533376852671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.04147840142250061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,balanced,0.05542933444182078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,balanced,0.04038399954636892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.09434880018234253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,balanced,0.05875733494758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,balanced,0.04102933406829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,balanced,0.13566399614016214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.041388800740242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,balanced,0.04906666775544485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,balanced,0.0631573349237442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.04456959962844849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,balanced,0.04931733508904775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.1309056043624878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.04444800019264221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,balanced,0.06630399823188782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.04780159890651703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.12215679883956909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.0500544011592865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,balanced,0.07805333534876506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.147871994972229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.051148802042007446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.0537663996219635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.16033920049667358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,balanced,0.20617065827051798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,balanced,0.08443733056386311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.05431680083274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.22901759147644044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.2449984073638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,balanced,0.05004266897837321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.06865919828414917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.01,0.33045120239257814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,balanced,0.10106133421262105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,balanced,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.06599680185317994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.01,0.5047039985656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.0865664005279541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,balanced,0.05569066603978475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.09025920033454896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.01,0.5945600032806396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,balanced,0.11645866433779399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.12067840099334717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.01,0.9802495956420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.12706559896469116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,balanced,0.23202667633692423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.01,1.0072959899902343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.17025279998779297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,balanced,0.15569067001342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.01,1.724787139892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.20446720123291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.30919680595397947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,balanced,0.06458666423956554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.01,4.008838272094726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.4035071849822998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,0.50862717628479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,balanced,0.06829333305358887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,0.7345791816711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,balanced,0.18099733193715414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.01,0.8425215721130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.01,1.2707455635070801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,balanced,0.26321067412694293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.01,3.351871871948242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,balanced,0.08377599716186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,balanced,0.2622239987055461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,balanced,0.09383466839790344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,power_law_1.01,0.031865599751472476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,power_law_1.01,0.030796799063682555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,power_law_1.01,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,balanced,0.31988267103830975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,power_law_1.01,0.03450239896774292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,balanced,0.12387200196584065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,power_law_1.01,0.03562879860401154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,power_law_1.01,0.03646079897880554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,balanced,0.3762880166371663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,power_law_1.01,0.03713920116424561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,power_law_1.01,0.03978239893913269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,power_law_1.01,0.04136320054531097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,balanced,0.14754133423169455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,64,power_law_1.2,0.053350400924682614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,power_law_1.01,0.051052802801132204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,power_law_1.01,0.05738239884376526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,balanced,0.3785333236058553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,64,power_law_1.2,0.046700799465179445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,power_law_1.01,0.06247040033340454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,64,power_law_1.2,0.04910080134868622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,power_law_1.01,0.067603200674057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,64,power_law_1.2,0.054073601961135864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,balanced,0.20698134104410806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,64,power_law_1.2,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,64,power_law_1.2,0.05802879929542541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,power_law_1.01,0.06862080097198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,64,power_law_1.2,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,power_law_1.01,0.08478080034255982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,64,power_law_1.2,0.05921279788017273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.01,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,64,power_law_1.2,0.059673601388931276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,64,power_law_1.2,0.06083199977874756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,64,power_law_1.2,0.06444159746170045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.01,0.10665600299835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,balanced,0.2632213234901428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,64,power_law_1.2,0.07178879976272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.01,0.16414079666137696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,64,power_law_1.2,0.08330240249633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,64,power_law_1.2,0.07712640166282654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.01,0.17902719974517822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,balanced,0.5784639914830526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,64,power_law_1.2,0.09048960208892823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.01,0.28548479080200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,64,power_law_1.2,0.10068479776382447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,64,power_law_1.2,0.10739840269088745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.01,0.45279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,64,power_law_1.2,0.13812479972839356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.01,0.5666240215301513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,64,power_law_1.2,0.1444991946220398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.01,0.7875711917877197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,64,power_law_1.2,0.1862720012664795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.01,1.1085311889648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,64,power_law_1.2,0.1958080053329468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,64,power_law_1.2,0.362611198425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,balanced,0.7145226796468099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,64,power_law_1.2,0.3944704055786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,balanced,0.33507732550303143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,power_law_1.01,1.3587519645690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,64,power_law_1.2,0.5525760173797607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,power_law_1.01,2.189107131958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,64,power_law_1.2,0.7039936065673829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,64,power_law_1.2,0.9522303581237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,power_law_1.01,4.996774291992187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,64,power_law_1.2,1.515225601196289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,64,power_law_1.2,1.6715456008911134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.0381056010723114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,64,power_law_1.2,3.3771007537841795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.03591679930686951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,64,power_law_1.2,7.3468482971191404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.04145280122756958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.04184960126876831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.041177600622177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.041945600509643556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,balanced,0.5304906765619913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.045023998618125914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,balanced,1.1128640174865723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.04808320105075836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.05103359818458557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.05260159969329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.05539839863777161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.05630720257759094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.06855040192604064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.06894720196723939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.07932159900665284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.0905023992061615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.11072640419006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.13482880592346191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.1456704020500183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.2228287935256958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.24042880535125732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,0.40344958305358886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,64,power_law_1.2,0.030399999022483824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,0.49176321029663084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,64,power_law_1.2,0.028780800104141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,0.8862591743469238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,balanced,0.03514666606982549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,64,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,1.0978816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,64,power_law_1.2,0.032876798510551454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,balanced,0.0346666673819224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,64,power_law_1.2,0.03270399868488312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,64,power_law_1.2,1.4973312377929688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,balanced,1.0564160346984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,balanced,0.034901333351929985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,64,power_law_1.2,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,64,power_law_1.2,2.2729984283447267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,64,power_law_1.2,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,balanced,0.045007998744646706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,64,power_law_1.2,0.03671039938926697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,balanced,0.05685333410898844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,64,power_law_1.2,5.750207901000977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,64,power_law_1.2,0.0423552006483078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,balanced,0.058101331194241844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,64,power_law_1.2,0.04622080028057098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,balanced,0.05756799876689911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,64,power_law_1.2,0.04890879988670349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,balanced,0.05811200042565664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,64,power_law_1.2,0.05538560152053833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,balanced,0.05807999769846598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,64,power_law_1.2,0.05453439950942993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,balanced,0.058143998185793556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,64,power_law_1.2,0.059654402732849124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,balanced,0.05930666625499725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,balanced,0.06029333174228668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,64,power_law_1.2,0.07051519751548767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,balanced,0.05972800155480703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,64,power_law_1.2,0.09253119826316833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,balanced,0.0628053347269694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,balanced,0.06427733103434245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,64,power_law_1.2,0.08584960103034973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,balanced,0.0658186674118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,64,power_law_1.2,0.10195200443267823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,balanced,0.06541333099206288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.2,0.1227455973625183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,balanced,0.07501866420110066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,balanced,0.07026133437951405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.2,0.17715840339660643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.2,0.22120959758758546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,balanced,0.08136533200740814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,balanced,0.07885866860548656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.2,0.3041599988937378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.2,0.3928512096405029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,balanced,0.09683199723561604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.2,0.7133632183074952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.2,0.9715135574340821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,balanced,0.10089066624641418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.2,1.4685248374938964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.2,2.0216064453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,balanced,0.14088533322016397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,64,power_law_1.2,2.3521663665771486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,balanced,0.03450666616360346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,64,power_law_1.2,4.510496139526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,balanced,0.03632533301909765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,balanced,0.035029334326585136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,balanced,0.036650667587916054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,64,power_law_1.2,8.945887756347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,balanced,0.1476746698220571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,balanced,0.03975466638803482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,balanced,0.041034666200478874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,balanced,0.042133331298828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,balanced,0.04188799858093262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,balanced,0.04171200096607208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,balanced,0.044906665881474815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,balanced,0.045221333702405296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,balanced,0.045791998505592346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,balanced,0.22197333971659342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.01,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,balanced,0.047237331668535866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,balanced,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.01,0.04933120012283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,balanced,0.05509866774082184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.01,0.04469119906425476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,balanced,0.05494399865468343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.01,0.04997760057449341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.01,0.051507198810577394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,balanced,0.06651199857393901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.01,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,balanced,0.06730666756629944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.01,0.05607039928436279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,balanced,0.2568693359692891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,balanced,0.08009600142637889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,balanced,0.02771199991305669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.01,0.05982080101966858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,balanced,0.027493332823117573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,balanced,0.0860586663087209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.01,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,balanced,0.027493332823117573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,balanced,0.030576000610987347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,balanced,0.10572800040245056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,balanced,0.0349440003434817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.01,0.06160640120506287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,balanced,0.03656533360481262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.01,0.0651968002319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,balanced,0.03711999952793121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.01,0.04376319944858551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,balanced,0.12148267030715942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,balanced,0.03631466627120972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.01,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.01,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,balanced,0.036501333117485046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.01,0.07501440048217774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.01,0.036339199542999266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,balanced,0.0378560001651446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,balanced,0.3296266595522563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.01,0.08126720190048217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.01,0.036160001158714296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,balanced,0.03902400036652883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,balanced,0.1663146714369456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.01,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.01,0.08165119886398316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,balanced,0.04070399949947993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.01,0.040479999780654904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.01,0.10722559690475464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,balanced,0.042165334026018776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.01,0.04087679982185364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.01,0.04190720021724701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.01,0.1346943974494934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.01,0.04599680006504059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.01,0.04792959988117218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.01,0.13496960401535035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,balanced,0.19482133785883585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,balanced,0.05123733480771383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.01,0.04960640072822571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.01,0.19073280096054077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.01,0.05027840137481689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,balanced,0.05179733534653982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.01,0.20628480911254882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.01,0.05309439897537231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.01,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.01,0.27666559219360354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.01,0.061766397953033444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.01,0.33680000305175783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.01,0.06362239718437195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.01,0.5052351951599121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.01,0.06913920044898987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,balanced,0.2834346691767375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.01,0.7456128120422363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.01,0.08696320056915283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,balanced,0.05249066650867462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.01,0.08747519850730896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.01,0.8543744087219238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.01,0.11516799926757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,balanced,0.05880533158779144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,balanced,0.4326719840367635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.01,0.11978880167007447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.01,1.430521583557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.01,0.16522879600524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,power_law_1.01,0.03273600041866302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,balanced,0.06019733349482218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.01,0.21176960468292236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.01,2.650726318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,power_law_1.01,0.031040000915527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.01,0.2571135997772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,power_law_1.01,0.028780800104141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.01,0.33781120777130125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,power_law_1.01,0.03195520043373108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.01,0.5198336124420166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,balanced,0.34838934739430744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,balanced,0.0711946686108907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,power_law_1.01,0.03340159952640533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.01,0.6225024223327636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,32,power_law_1.2,0.052185600996017455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,power_law_1.01,0.035596799850463864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.01,0.7443071842193604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,balanced,0.07595733304818471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,power_law_1.01,0.037222400307655334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.01,1.307539176940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,32,power_law_1.2,0.04366079866886139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,power_law_1.01,0.03875199854373932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,32,power_law_1.2,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.01,2.902675247192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,power_law_1.01,0.03898240029811859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,32,power_law_1.2,0.046438398957252505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,power_law_1.01,0.04170239865779877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,32,power_law_1.2,0.05322239995002746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,balanced,0.09691199660301208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,power_law_1.01,0.044659200310707095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,32,power_law_1.2,0.055315202474594115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,power_law_1.01,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,balanced,0.4189866781234741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,32,power_law_1.2,0.05583360195159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,power_law_1.01,0.048640000820159915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,balanced,0.11050666371981303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,32,power_law_1.2,0.0572160005569458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,power_law_1.01,0.0571008026599884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,32,power_law_1.2,0.060224002599716185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,power_law_1.01,0.06064640283584595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,32,power_law_1.2,0.0606656014919281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,32,power_law_1.2,0.062015998363494876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,power_law_1.01,0.06480640172958374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,32,power_law_1.2,0.06341760158538819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,32,power_law_1.2,0.0718720018863678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,balanced,0.1502026617527008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,32,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,power_law_1.01,0.07162879705429077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,32,power_law_1.2,0.07631999850273133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,power_law_1.01,0.08208000063896179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,32,power_law_1.2,0.08528000116348267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,power_law_1.01,0.0882752001285553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,32,power_law_1.2,0.09607679843902588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,balanced,0.18502400318781534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,32,power_law_1.2,0.12526079416275024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,power_law_1.01,0.12216320037841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,balanced,0.8466506799062093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,power_law_1.01,0.14672640562057496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,32,power_law_1.2,0.1181056022644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,32,power_law_1.2,0.16122879981994628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,balanced,0.6411199967066447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,power_law_1.01,0.2000960111618042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,32,power_law_1.2,0.15905920267105103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,power_law_1.01,0.27489919662475587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,32,power_law_1.2,0.27923200130462644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,balanced,0.2760266661643982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,32,power_law_1.2,0.24992640018463136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,power_law_1.01,0.4130943775177002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,32,power_law_1.2,0.4557951927185059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,power_law_1.01,0.4606336116790771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,32,power_law_1.2,0.4902656078338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,power_law_1.01,0.7491007804870605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,32,power_law_1.2,0.7747712135314941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,power_law_1.01,1.1807168006896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,32,power_law_1.2,1.1629759788513183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,balanced,0.36393598715464276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,32,power_law_1.2,0.04481280148029328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,32,power_law_1.2,1.6224447250366212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,32,power_law_1.2,0.03405439853668213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,power_law_1.01,1.2469632148742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,32,power_law_1.2,2.734873580932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,32,power_law_1.2,0.03436160087585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,power_law_1.01,2.2805759429931642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,32,power_law_1.2,0.03694080114364624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,32,power_law_1.2,5.133440017700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,32,power_law_1.2,0.0380160003900528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,power_law_1.01,4.452659225463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,32,power_law_1.2,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,32,power_law_1.2,0.03937920033931732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,32,power_law_1.2,0.04214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,balanced,0.45579198996225995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,32,power_law_1.2,0.04607360064983368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,32,power_law_1.2,0.04748800098896026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,32,power_law_1.2,0.050316798686981204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,32,power_law_1.2,0.05175679922103882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,32,power_law_1.2,0.05677440166473389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,balanced,1.2352533340454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,32,power_law_1.2,0.05453439950942993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,32,power_law_1.2,0.06346240043640136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,32,power_law_1.2,0.06524159908294677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,32,power_law_1.2,0.07406079769134521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,32,power_law_1.2,0.08892160058021545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,32,power_law_1.2,0.09317759871482849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,balanced,0.696021318435669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,32,power_law_1.2,0.11564160585403442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,32,power_law_1.2,0.1396607995033264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,32,power_law_1.2,0.2057408094406128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,32,power_law_1.2,0.2568831920623779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,32,power_law_1.2,0.3285248041152954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,32,power_law_1.2,0.4280128002166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,32,power_law_1.2,0.8191488265991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,32,power_law_1.2,0.767033576965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,32,power_law_1.2,1.0894975662231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,32,power_law_1.2,2.2513216018676756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,32,power_law_1.2,4.999135971069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,balanced,0.03448000053564707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,balanced,0.034458667039871216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,32,power_law_1.2,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,balanced,0.03065599997838338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,32,power_law_1.2,0.029919999837875366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,balanced,0.04144000013669332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,32,power_law_1.2,0.02865920066833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,balanced,0.056133334835370384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,balanced,1.383680025736491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,32,power_law_1.2,0.03432320058345795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,balanced,0.05418666700522105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,32,power_law_1.2,0.03356159925460815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,32,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,balanced,0.054666668176651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,32,power_law_1.2,0.036473599076271054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,balanced,0.05877333382765452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,32,power_law_1.2,0.040249601006507874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,32,power_law_1.2,0.04162560105323791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,balanced,0.05815466741720835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,32,power_law_1.2,0.04271360039710999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,32,power_law_1.2,0.04517120122909546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,balanced,0.058117335041364036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,32,power_law_1.2,0.04890879988670349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,32,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,balanced,0.058965335289637245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,32,power_law_1.2,0.05826560258865356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,balanced,0.06029866635799408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,32,power_law_1.2,0.06335999965667724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,balanced,0.06021333237489065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,32,power_law_1.2,0.06993280053138733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,balanced,0.060880000392595925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,balanced,0.06526400148868561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,balanced,0.06528000036875407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,32,power_law_1.2,0.07447680234909057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,balanced,0.06804800033569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,32,power_law_1.2,0.09721599817276001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,balanced,0.07940266529719035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,32,power_law_1.2,0.09873279929161072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,balanced,0.07314133147398631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,32,power_law_1.2,0.1278272032737732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,balanced,0.03275733441114426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,32,power_law_1.2,0.19421440362930298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,balanced,0.08724266290664673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,balanced,0.03302400062481562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,balanced,0.03492266684770584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,balanced,0.08308800061543782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,32,power_law_1.2,0.27390079498291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,balanced,0.03688533355792364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,32,power_law_1.2,0.33271040916442873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,balanced,0.040709334115187325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,balanced,0.04231466849644979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,balanced,0.10897599657376607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,32,power_law_1.2,0.5551424026489258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,balanced,0.04306666553020477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,32,power_law_1.2,0.6759935855865479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,balanced,0.042810668547948204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,balanced,0.04321066538492838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,32,power_law_1.2,1.251136016845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,balanced,0.11582932869593303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,balanced,0.0439573327700297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,32,power_law_1.2,2.0065280914306642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,balanced,0.04568533102671305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,balanced,0.045642669002215065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,balanced,0.04740266501903534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,32,power_law_1.2,2.0137792587280274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,balanced,0.16127467155456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,balanced,0.05032533407211304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,32,power_law_1.2,3.4547840118408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,balanced,0.05644799768924713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,balanced,0.056554665168126426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,32,power_law_1.2,9.61193618774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.01,0.05226879715919495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,balanced,0.0603359987338384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,balanced,0.18016533056894937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,balanced,0.07023466626803081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.01,0.045747199654579164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.01,0.03805440068244934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,balanced,0.07066666583220164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.01,0.0441536009311676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,balanced,0.08531199892361958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.01,0.04769920110702515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,balanced,0.09289600451787312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.01,0.0523967981338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,balanced,0.0277813325325648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,balanced,0.27319467067718506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.01,0.05315200090408325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.01,0.04476799964904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,balanced,0.02757333219051361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,balanced,0.1172213355700175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.01,0.056505602598190305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,balanced,0.028186666468779247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.01,0.037088000774383546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.01,0.05604479908943176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,balanced,0.03125333289305369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.01,0.03619199991226196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,balanced,0.036703998843828835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.01,0.05763840079307556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,balanced,0.13355200489362082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.01,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,balanced,0.03864533454179764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.01,0.04014720022678375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.01,0.0630400002002716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,balanced,0.03868799904982249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.01,0.06445440053939819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,balanced,0.03850133220354716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.01,0.042745599150657655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.01,0.06476799845695495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,balanced,0.33001599709192914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,balanced,0.040074666341145836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.01,0.042284798622131345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,balanced,0.1850879987080892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.01,0.0652288019657135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,balanced,0.041135999063650765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.01,0.043993601202964784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.01,0.07100800275802613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,balanced,0.04160533348719279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.01,0.045824000239372255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.01,0.07269759774208069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,balanced,0.042821332812309265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.01,0.07998719811439514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.01,0.04803839921951294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,balanced,0.044122666120529175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.01,0.0990015983581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.01,0.048640000820159915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,balanced,0.2273120085398356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.01,0.09335039854049683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,balanced,0.04558933277924856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.01,0.050246399641036985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.01,0.12768640518188476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.01,0.05235840082168579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.01,0.13100160360336305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.01,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.01,0.17538559436798096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,balanced,0.05420266588528951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.01,0.061222398281097413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.01,0.18632320165634156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,balanced,0.37911466757456463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.01,0.2673151969909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,balanced,0.05494399865468343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.01,0.06316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.01,0.3723839998245239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.01,0.07103360295295716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.01,0.4537087917327881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.01,0.08275200128555298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,balanced,0.33553067843119305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.01,0.6052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.01,0.08377599716186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.01,0.10722559690475464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.01,0.8103679656982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.01,0.12609920501708985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,balanced,0.05804799993832906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.01,1.3484928131103515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.01,0.17091200351715088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,balanced,0.06586666901906331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.01,2.7445568084716796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.01,0.19413119554519653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.01,0.27808640003204343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,balanced,0.06793599824110667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.01,0.3205375909805298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,power_law_1.01,0.03581439852714539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,balanced,0.4227413336435954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.01,0.45871357917785643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,power_law_1.01,0.030668801069259642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.01,0.7027200222015381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,balanced,0.0841919978459676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,power_law_1.01,0.029023998975753786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.01,0.7948031902313233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,balanced,0.5564746856689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,power_law_1.01,0.03463039994239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,balanced,0.09149332841237386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,power_law_1.01,0.03585920035839081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.01,1.587667179107666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,power_law_1.01,0.03740800023078918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,power_law_1.01,0.03769600093364715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.01,2.8893823623657227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,power_law_1.01,0.04246399998664856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,power_law_1.01,0.043296000361442565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,balanced,0.5102666616439819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,balanced,0.12149332960446675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,power_law_1.01,0.0466623991727829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,16,power_law_1.2,0.05141760110855102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,power_law_1.01,0.04880000054836273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,16,power_law_1.2,0.037836799025535585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,balanced,0.14392000436782837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,power_law_1.01,0.052249598503112796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,16,power_law_1.2,0.03868800103664398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,16,power_law_1.2,0.04357759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,power_law_1.01,0.05682560205459595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,16,power_law_1.2,0.04709759950637817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,16,power_law_1.2,0.05430399775505066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,power_law_1.01,0.06495360136032105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,16,power_law_1.2,0.05480960011482239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,16,power_law_1.2,0.05800960063934326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,power_law_1.01,0.06689919829368592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,16,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,16,power_law_1.2,0.059033602476119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,balanced,0.218341330687205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,16,power_law_1.2,0.0598143994808197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,power_law_1.01,0.07290239930152893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,16,power_law_1.2,0.0643775999546051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,16,power_law_1.2,0.06417279839515685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,power_law_1.01,0.08570880293846131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,16,power_law_1.2,0.06673920154571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,power_law_1.01,0.10223360061645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,16,power_law_1.2,0.0725055992603302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,balanced,0.28301332394282025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,16,power_law_1.2,0.07690879702568054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,balanced,0.7637973626454672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,power_law_1.01,0.12023680210113526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,16,power_law_1.2,0.08767359852790832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,16,power_law_1.2,0.10555520057678222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,power_law_1.01,0.15633920431137086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,16,power_law_1.2,0.10144000053405762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,16,power_law_1.2,0.12799359560012818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,power_law_1.01,0.23871359825134278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,16,power_law_1.2,0.1356160044670105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,power_law_1.01,0.31164801120758057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,16,power_law_1.2,0.21566081047058105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,balanced,0.40607468287150067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,16,power_law_1.2,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,16,power_law_1.2,0.2991872072219849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,power_law_1.01,0.39969279766082766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,balanced,1.0677013397216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,16,power_law_1.2,0.3650559902191162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,power_law_1.01,0.613920021057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,16,power_law_1.2,0.586630392074585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,power_law_1.01,0.935916805267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,16,power_law_1.2,0.875487995147705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,power_law_1.01,1.0433600425720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,16,power_law_1.2,1.1103103637695313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,power_law_1.01,1.4883904457092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,16,power_law_1.2,1.9490240097045899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,power_law_1.01,2.1232511520385744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,balanced,0.5242986679077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,16,power_law_1.2,5.107891082763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,power_law_1.01,4.265990447998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,16,power_law_1.2,0.04447360038757324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,balanced,0.6490559975306193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,16,power_law_1.2,0.034483200311660765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,16,power_law_1.2,0.03671039938926697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,16,power_law_1.2,0.03611519932746887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,16,power_law_1.2,0.03922559916973114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,16,power_law_1.2,0.042483198642730716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,balanced,1.4987680117289226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,16,power_law_1.2,0.042656001448631284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,16,power_law_1.2,0.04437119960784912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,16,power_law_1.2,0.04503040015697479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,16,power_law_1.2,0.04700160026550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,16,power_law_1.2,0.05055360198020935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,16,power_law_1.2,0.05317760109901428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,16,power_law_1.2,0.05367040038108826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,16,power_law_1.2,0.05454080104827881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,16,power_law_1.2,0.06481919884681701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,balanced,1.0070079962412517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,16,power_law_1.2,0.06906880140304565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,16,power_law_1.2,0.07237759828567505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,16,power_law_1.2,0.08858879804611205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,16,power_law_1.2,0.09944319725036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,16,power_law_1.2,0.11418240070343018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,16,power_law_1.2,0.13228800296783447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,16,power_law_1.2,0.19203840494155883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,16,power_law_1.2,0.2566783905029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,16,power_law_1.2,0.3627327919006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,16,power_law_1.2,0.458892822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,16,power_law_1.2,0.6761343955993653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,16,power_law_1.2,0.9530879974365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,16,power_law_1.2,1.1156352043151856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,16,power_law_1.2,2.013932800292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,16,power_law_1.2,4.435718536376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,16,power_law_1.2,0.03607040047645569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,16,power_law_1.2,0.029497599601745604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,16,power_law_1.2,0.030131199955940248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,16,power_law_1.2,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,16,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,16,power_law_1.2,0.038848000764846805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,16,power_law_1.2,0.03951359987258911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,balanced,1.9986613591512044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,16,power_law_1.2,0.04248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,16,power_law_1.2,0.04414080083370209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,balanced,0.03291733314593633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,16,power_law_1.2,0.04376960098743439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,balanced,0.029626667499542236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,16,power_law_1.2,0.048582398891448976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,balanced,0.03105599929889043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,16,power_law_1.2,0.05132799744606018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,balanced,0.039605334401130676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,16,power_law_1.2,0.05325440168380737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,balanced,0.05468800167242686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,16,power_law_1.2,0.06113280057907104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,balanced,0.05589333176612854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,16,power_law_1.2,0.06884480118751526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,balanced,0.05603733162085215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,balanced,0.05646933118502299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,16,power_law_1.2,0.07388799786567687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,balanced,0.05705599983533224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,balanced,0.05804799993832906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,16,power_law_1.2,0.07806079983711242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,balanced,0.058373332023620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,balanced,0.05899199843406677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,16,power_law_1.2,0.09315840005874634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,balanced,0.060421332716941833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,16,power_law_1.2,0.10526080131530761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,balanced,0.06462400158246358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,balanced,0.06773333251476288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,16,power_law_1.2,0.14139519929885863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,balanced,0.06880533198515575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,16,power_law_1.2,0.189792001247406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,balanced,0.07234666744867961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,16,power_law_1.2,0.25925118923187257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,balanced,0.08577066659927368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,16,power_law_1.2,0.32067840099334716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,balanced,0.081386665503184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,balanced,0.0983893374602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,16,power_law_1.2,0.4942463874816895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,balanced,0.033002667129039764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,16,power_law_1.2,0.7021632194519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,balanced,0.09815466403961182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,balanced,0.032826667030652366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,16,power_law_1.2,1.1591872215270995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,balanced,0.03634133438269297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.01,0.04102399945259094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,16,power_law_1.2,1.8608831405639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,balanced,0.0395413339138031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,balanced,0.1344533363978068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.01,0.04028800129890442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,balanced,0.04649066428343455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,16,power_law_1.2,2.0035327911376952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.01,0.03650560081005096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,balanced,0.04720533390839895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.01,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,balanced,0.046623999873797096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,balanced,0.1479573349157969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.01,0.049958398938179015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,16,power_law_1.2,3.378355026245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,balanced,0.04833066463470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.01,0.05438719987869263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,balanced,0.028959999481836956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.01,0.055302399396896365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,balanced,0.04800533254941305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,balanced,0.030559999247392017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,16,power_law_1.2,8.881881713867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.01,0.0576960027217865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,balanced,0.04933333396911621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,balanced,0.030762667457262676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,balanced,0.21337066094080606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.01,0.05917440056800842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,balanced,0.05003199974695841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.01,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,balanced,0.05087466537952423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,balanced,0.038746667404969536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,balanced,0.04087999959786733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,balanced,0.052282666166623436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.01,0.06445440053939819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,balanced,0.04344533383846283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,balanced,0.05363733569780985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.01,0.0648959994316101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,balanced,0.04252266883850098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,balanced,0.2508959968884786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,balanced,0.044362664222717285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,balanced,0.059893334905306496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.01,0.06561279892921448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.01,0.03769600093364715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,balanced,0.04524800181388855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,balanced,0.06081066528956095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.01,0.067603200674057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,balanced,0.04719999929269155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.01,0.0344895988702774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,balanced,0.06608533362547557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.01,0.0738431990146637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,balanced,0.049360002080599465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.01,0.03607679903507233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,balanced,0.07789333164691925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,balanced,0.050928001602490745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.01,0.07956479787826538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.01,0.03738240003585815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,balanced,0.05263466636339823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.01,0.08791679739952088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,balanced,0.3805546760559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,balanced,0.07796800136566162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.01,0.0409855991601944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.01,0.09804800152778625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.01,0.04652799963951111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,balanced,0.09531199932098389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,balanced,0.06477333108584087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.01,0.10255359411239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.01,0.046188798546791074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,balanced,0.06384000182151794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.01,0.047225600481033324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.01,0.11463680267333984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,balanced,0.1014453371365865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.01,0.048895999789237976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.01,0.13511680364608764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.01,0.04987519979476929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.01,0.17059199810028075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,balanced,0.13968533277511597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.01,0.051123201847076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.01,0.21121280193328856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.01,0.05482239723205566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,balanced,0.4692213137944539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.01,0.28177919387817385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,balanced,0.06972800195217133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.01,0.056383997201919556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,balanced,0.16677866379419962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.01,0.3808255910873413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.01,0.05861120223999024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,balanced,0.08381866415341695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.01,0.5232511997222901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.01,0.06318719983100891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,balanced,0.08533333738644917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.01,0.06801279783248901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.01,0.7495168209075928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.01,0.0762880027294159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,balanced,0.24021865924199423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.01,0.8404352188110351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.01,0.0841152012348175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.01,1.3376319885253907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.01,0.09501439929008484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,balanced,0.11028800408045451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.01,0.11822079420089722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.01,2.558022308349609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.01,0.12885760068893432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,balanced,0.12779733538627625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,balanced,0.3000640074412028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.01,0.17697919607162477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,balanced,0.5645120143890381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.01,0.22828800678253175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.01,0.3073920011520386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.01,0.4207295894622803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.01,0.6074687957763671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,balanced,0.19661333163579306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.01,0.7315904140472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,balanced,0.44569067160288495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.01,0.9368512153625488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,balanced,0.24702399969100952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.01,1.5005951881408692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.01,3.0605567932128905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,balanced,0.35207998752593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,balanced,0.5781173308690389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,power_law_1.01,0.035180801153182985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,balanced,0.813103993733724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,power_law_1.01,0.03191039860248566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,balanced,0.45127467314402264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,power_law_1.01,0.035545599460601804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,8,power_law_1.2,0.03984639942646027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,power_law_1.01,0.04399999976158142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,8,power_law_1.2,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,power_law_1.01,0.04542079865932465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,8,power_law_1.2,0.0378495991230011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,power_law_1.01,0.04716159999370575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,8,power_law_1.2,0.043110400438308716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,balanced,0.6553920110066732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,balanced,0.7040692965189616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,8,power_law_1.2,0.04385280013084412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,power_law_1.01,0.05127040147781372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,8,power_law_1.2,0.05397760272026062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,power_law_1.01,0.052275198698043826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,8,power_law_1.2,0.05648639798164368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,8,power_law_1.2,0.05889279842376709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,power_law_1.01,0.060166400671005246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,8,power_law_1.2,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,power_law_1.01,0.060627198219299315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,8,power_law_1.2,0.05926399827003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,power_law_1.01,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,8,power_law_1.2,0.0648639976978302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,8,power_law_1.2,0.0659712016582489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,8,power_law_1.2,0.06609280109405517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,power_law_1.01,0.07109119892120361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,balanced,0.8508853117624918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,8,power_law_1.2,0.06974719762802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,power_law_1.01,0.07516800165176392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,8,power_law_1.2,0.076665598154068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,8,power_law_1.2,0.08448640108108521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,8,power_law_1.2,0.08903040289878845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,power_law_1.01,0.08284159898757934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,8,power_law_1.2,0.1034816026687622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,power_law_1.01,0.10049279928207397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,8,power_law_1.2,0.10434559583663941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,power_law_1.01,0.12263679504394531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,8,power_law_1.2,0.13370879888534545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,balanced,1.045525312423706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,8,power_law_1.2,0.141702401638031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,power_law_1.01,0.15724159479141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,8,power_law_1.2,0.21050240993499755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,8,power_law_1.2,0.22232320308685302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,power_law_1.01,0.19411200284957886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,balanced,1.0556053320566814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,8,power_law_1.2,0.3235136032104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,8,power_law_1.2,0.5215551853179932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,power_law_1.01,0.2808511972427368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,8,power_law_1.2,0.7163455963134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,balanced,1.5849706331888835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,8,power_law_1.2,0.8495231628417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,power_law_1.01,0.3709887981414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,8,power_law_1.2,1.1813823699951171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,8,power_law_1.2,2.0934528350830077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,power_law_1.01,0.5612224102020263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,8,power_law_1.2,4.763872146606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,power_law_1.01,0.7717567920684815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,power_law_1.01,1.154470443725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,8,power_law_1.2,0.03783040046691895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,power_law_1.01,1.467737579345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,8,power_law_1.2,0.032492798566818235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,power_law_1.01,1.9148351669311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,balanced,1.6635680198669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,8,power_law_1.2,0.03553920090198517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,8,power_law_1.2,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,power_law_1.01,3.095097541809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,8,power_law_1.2,0.04069119989871979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,8,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,power_law_1.01,5.8495231628417965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,8,power_law_1.2,0.04758400022983551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,8,power_law_1.2,0.04764159917831421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,8,power_law_1.2,0.04958080053329468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,8,power_law_1.2,0.049804800748825075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,8,power_law_1.2,0.05173119902610779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,8,power_law_1.2,0.0561024010181427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,balanced,2.0569279988606772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,8,power_law_1.2,0.05822719931602478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,8,power_law_1.2,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,8,power_law_1.2,0.06387199759483338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,8,power_law_1.2,0.0700160026550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,8,power_law_1.2,0.08270080089569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,8,power_law_1.2,0.08729599714279175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,8,power_law_1.2,0.09770879745483399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,8,power_law_1.2,0.12234879732131958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,8,power_law_1.2,0.1427839994430542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,8,power_law_1.2,0.18647040128707887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,8,power_law_1.2,0.2482367992401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,8,power_law_1.2,0.35358080863952634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,8,power_law_1.2,0.5322303771972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,balanced,3.30130672454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,8,power_law_1.2,0.7715519905090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,8,power_law_1.2,1.1872320175170898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,8,power_law_1.2,1.0747455596923827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,8,power_law_1.2,2.1929599761962892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,8,power_law_1.2,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,8,power_law_1.2,4.034380722045898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,8,power_law_1.2,0.03129599988460541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,8,power_law_1.2,0.032332798838615416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,balanced,0.035216001172860466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,8,power_law_1.2,0.035257598757743834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,balanced,0.03572266548871994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,8,power_law_1.2,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,balanced,0.0439626673857371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,8,power_law_1.2,0.043859198689460754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,balanced,0.04786133269468943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,8,power_law_1.2,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,balanced,0.06166933476924896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,8,power_law_1.2,0.04764159917831421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,balanced,0.06334400177001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,balanced,0.06399466594060262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,8,power_law_1.2,0.0492031991481781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,balanced,0.06435200075308482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,8,power_law_1.2,0.05143679976463318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,balanced,0.06414933502674103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,8,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,balanced,0.06465066472689311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,8,power_law_1.2,0.05607680082321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,balanced,0.0658240020275116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,8,power_law_1.2,0.06173440217971802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,balanced,0.06691733499368031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,8,power_law_1.2,0.06755840182304382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,balanced,0.06799999872843425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,balanced,0.07032533486684163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,8,power_law_1.2,0.07517439723014832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,balanced,0.07563200096289317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,8,power_law_1.2,0.07803519964218139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,balanced,0.07761600116888683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,balanced,0.08249066770076752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,balanced,0.09487467010815938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,8,power_law_1.2,0.09010559916496277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,balanced,0.0976586639881134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,8,power_law_1.2,0.10826879739761353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,balanced,0.115365336338679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,8,power_law_1.2,0.12305279970169067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,balanced,0.12990400195121765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,8,power_law_1.2,0.19122560024261476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,8,power_law_1.2,0.2366015911102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,balanced,0.17689067125320435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,8,power_law_1.2,0.3171776056289673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,8,power_law_1.2,0.4309375762939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,balanced,0.21920533974965414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,8,power_law_1.2,0.7060800075531006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,balanced,0.03339733431736628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,8,power_law_1.2,0.9388352394104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,balanced,0.3163573344548543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,8,power_law_1.2,1.4398079872131349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,balanced,0.033861334125200905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,balanced,0.03577066709597906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,8,power_law_1.2,2.042246437072754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,balanced,0.041834667325019836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,8,power_law_1.2,2.555571174621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,balanced,0.05050133168697357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,balanced,0.4293493429819743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,balanced,0.05134400228659312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,8,power_law_1.2,4.510982513427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,balanced,0.05340266724427541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,balanced,0.05199466645717621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,balanced,0.05384533107280731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,8,power_law_1.2,8.376838684082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,balanced,0.05618133147557577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,balanced,0.6162346601486206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,balanced,0.05961066484451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,balanced,0.059802666306495667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,balanced,0.061679999033610024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,balanced,0.06957866748174031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,balanced,0.07027733325958252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.01,0.03787519931793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,balanced,0.07735999921957652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.01,0.04590719938278198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,balanced,0.8007466793060303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,balanced,0.08682133754094441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.01,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.01,0.04601599872112274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,balanced,0.0941973328590393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.01,0.04940159916877747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.01,0.06159999966621399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,balanced,0.11300800244013469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.01,0.06267520189285278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,balanced,0.12966932853062949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.01,0.035392001271247864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.01,0.06399359703063964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.01,0.06558079719543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.01,0.035718399286270144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,balanced,0.18141865730285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.01,0.06773120164871216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.01,0.035148799419403076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.01,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.01,0.03927040100097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,balanced,0.9825653235117594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,balanced,0.22622400522232056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.01,0.06951680183410644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.01,0.04350079894065857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.01,0.07056000232696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.01,0.04991360008716583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.01,0.07582079768180847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.01,0.05136640071868896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,balanced,0.3492106596628825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.01,0.05149440169334411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.01,0.08328959941864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.01,0.08535040020942689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.01,0.05532159805297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.01,0.09165440201759338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.01,0.05807999968528747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.01,0.11593600511550903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,balanced,0.4658133188883464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.01,0.06124160289764404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.01,0.06412799954414368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.01,0.1165120005607605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.01,0.06673280000686646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.01,0.1488703966140747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.01,0.0750656008720398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.01,0.15562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.01,0.07951359748840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.01,0.21016960144042968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.01,0.08417919874191285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,balanced,0.6822453339894613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.01,0.10272639989852905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,balanced,1.404655933380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.01,0.24662399291992188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.01,0.11140480041503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.01,0.386406397819519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.01,0.1364416003227234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.01,0.5555456161499024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.01,0.16533759832382203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.01,0.23363199234008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.01,0.7329984188079834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.01,0.2824959993362427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,4,power_law_1.2,0.03790720105171204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.01,1.122208023071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.01,0.40380158424377444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,4,power_law_1.2,0.03544960021972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.01,0.5322624206542969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.01,1.103321647644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,4,power_law_1.2,0.03776000142097473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,balanced,0.8269866307576498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,4,power_law_1.2,0.044198399782180785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.01,0.8305983543395996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.01,2.139846420288086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,4,power_law_1.2,0.050547200441360476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.01,1.0476096153259278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,4,power_law_1.2,0.06047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.01,1.3243071556091308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,4,power_law_1.2,0.0627776026725769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.01,3.9920574188232423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,4,power_law_1.2,0.06442880034446716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.01,2.0705791473388673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,4,power_law_1.2,0.06533759832382202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,4,power_law_1.2,0.06458240151405334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,4,power_law_1.2,0.06787199974060058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.01,4.201772689819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,4,power_law_1.2,0.07063040137290955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,4,power_law_1.2,0.07311999797821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,4,power_law_1.2,0.07832319736480713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,balanced,1.0447359879811604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,4,power_law_1.2,0.08418560028076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,4,power_law_1.2,0.0873856008052826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,4,power_law_1.2,0.09409279823303222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,4,power_law_1.2,0.1174015998840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,4,power_law_1.2,0.11463040113449097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,4,power_law_1.2,0.14494080543518068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,4,power_law_1.2,0.1590208053588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,4,power_law_1.2,0.2491391897201538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,4,power_law_1.2,0.28243839740753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,4,power_law_1.2,0.42500481605529783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,4,power_law_1.2,0.5274816036224366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,4,power_law_1.2,0.8944448471069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,balanced,2.7386452356974282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,4,power_law_1.2,1.106163215637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,4,power_law_1.2,1.5210944175720216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,4,power_law_1.2,2.4413503646850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,balanced,1.6142667134602864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,4,power_law_1.2,5.93304328918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,4,power_law_1.2,0.03530240058898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,4,power_law_1.2,0.03344640135765076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,4,power_law_1.2,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,4,power_law_1.2,0.04008319973945618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,4,power_law_1.2,0.04359680116176605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,4,power_law_1.2,0.049983999133110045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,4,power_law_1.2,0.051686400175094606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,4,power_law_1.2,0.05306239724159241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,4,power_law_1.2,0.05448960065841675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,4,power_law_1.2,0.055769598484039305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,4,power_law_1.2,0.05873280167579651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,4,power_law_1.2,0.06342399716377259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,4,power_law_1.2,0.0649407982826233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,balanced,3.1992212931315103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,4,power_law_1.2,0.06766080260276794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,4,power_law_1.2,0.07614719867706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,4,power_law_1.2,0.0806335985660553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,4,power_law_1.2,0.09025279879570007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,4,power_law_1.2,0.10359679460525513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,4,power_law_1.2,0.11475839614868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,4,power_law_1.2,0.14647040367126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,4,power_law_1.2,0.17951359748840331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,4,power_law_1.2,0.23264000415802003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,4,power_law_1.2,0.2957887887954712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,4,power_law_1.2,0.4631552219390869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,4,power_law_1.2,0.6077631950378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,4,power_law_1.2,0.9389504432678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,4,power_law_1.2,1.1922880172729493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,4,power_law_1.2,1.5551744461059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,4,power_law_1.2,2.333945655822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,4,power_law_1.2,5.4424385070800785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,balanced,0.036746665835380554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,balanced,0.03755733370780945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,balanced,0.03484266748030981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,balanced,0.048197334011395775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,balanced,0.057717333237330117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,balanced,0.0364479993780454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,balanced,0.0709440012772878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,balanced,0.042730664213498436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,balanced,0.07314666608969371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,balanced,0.05020800232887268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,balanced,0.07411199808120728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,balanced,0.06419733166694641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,balanced,0.07527466615041097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,balanced,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,balanced,0.07746666669845581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,balanced,0.07655466596285503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,balanced,0.06829866766929626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,balanced,0.08352532982826233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,balanced,0.06769600013891856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,balanced,0.07992533346017201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,balanced,0.08566400408744812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,balanced,0.06865066786607106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,balanced,0.08799466490745544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,balanced,0.0911253293355306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,balanced,0.07048533360163371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,balanced,0.09384000301361084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,balanced,0.07122666637102763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,balanced,0.10754133264223735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,balanced,0.0751146674156189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,balanced,0.12129599849383037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,balanced,0.07605866591135661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.01,0.037062400579452516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,balanced,0.13454932967821756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,balanced,0.08062933385372162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.01,0.0366784006357193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,balanced,0.08782399694124858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,balanced,0.16149333119392395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,balanced,0.09283733367919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,balanced,0.18734399477640787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.01,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,balanced,0.10627200206120808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.01,0.054630398750305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,balanced,0.26768000920613605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.01,0.06926720142364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,balanced,0.11713066697120667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.01,0.07190399765968322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.01,0.03478400111198425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,balanced,0.13200533390045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.01,0.07427200078964233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,balanced,0.3367893298467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.01,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.01,0.07599999904632568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,balanced,0.15942399700482687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.01,0.040006399154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.01,0.07682560086250305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.01,0.04627200067043304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.01,0.08074880242347718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.01,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,balanced,0.19179733594258627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.01,0.08344320058822632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,balanced,0.5498613516489664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.01,0.06135680079460144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.01,0.08362240195274354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.01,0.06249600052833557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.01,0.09082239866256714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.01,0.06392319798469544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,balanced,0.27585599819819134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.01,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.01,0.09649919867515563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.01,0.06915199756622314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.01,0.11196160316467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.01,0.0742464005947113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,balanced,0.7232000033060709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.01,0.11213439702987671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,balanced,0.34198399384816486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.01,0.07897599935531616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.01,0.14291839599609374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.01,0.0821183979511261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.01,0.1527999997138977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.01,0.085971200466156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.01,0.17893120050430297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.01,0.0971455991268158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.01,0.22038400173187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.01,0.1053887963294983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,balanced,0.5449493328730265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.01,0.31704959869384763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.01,0.11064319610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.01,0.1312384009361267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.01,0.4047999858856201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,balanced,1.07041597366333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.01,0.15072640180587768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.01,0.5635647773742676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.01,0.19704320430755615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.01,0.7176896095275879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.01,0.22426879405975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,balanced,0.760703961054484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.01,0.3142528057098389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.01,1.0784192085266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.01,0.3834559917449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.01,1.3758655548095704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.01,0.5940095901489257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.01,1.8179136276245118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.01,0.7731008052825927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.01,1.1840127944946288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.01,2.9913984298706056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.01,1.4862848281860352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,balanced,1.3004000186920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.01,1.8569856643676759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.01,6.088735961914063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,balanced,1.1454613208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.01,3.257497787475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.01,6.185311889648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,balanced,1.4047733942667644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,balanced,1.6303680737813313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,balanced,1.7592639923095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,balanced,2.547621409098307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,2,power_law_1.2,0.036934399604797365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,2,power_law_1.2,0.035046398639678955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,2,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,2,power_law_1.2,0.035078400373458864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,2,power_law_1.2,0.044844800233840944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,2,power_law_1.2,0.048256000876426695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,2,power_law_1.2,0.03994880020618439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,2,power_law_1.2,0.0522816002368927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,2,power_law_1.2,0.0457152009010315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,2,power_law_1.2,0.05008640289306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,2,power_law_1.2,0.06813439726829529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,2,power_law_1.2,0.0610368013381958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,2,power_law_1.2,0.07445759773254394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,balanced,2.7817068099975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,2,power_law_1.2,0.06356480121612548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,2,power_law_1.2,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,2,power_law_1.2,0.06686720252037048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,2,power_law_1.2,0.07587199807167053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,2,power_law_1.2,0.0698303997516632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,2,power_law_1.2,0.0765887975692749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,2,power_law_1.2,0.07140480279922486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,2,power_law_1.2,0.08288000226020813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,2,power_law_1.2,0.0753600001335144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,2,power_law_1.2,0.08195199966430664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,2,power_law_1.2,0.0807807981967926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,2,power_law_1.2,0.08511360287666321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,2,power_law_1.2,0.0846015989780426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,2,power_law_1.2,0.09260159730911255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,2,power_law_1.2,0.08773120045661927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,2,power_law_1.2,0.10033919811248779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,2,power_law_1.2,0.09883520007133484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,2,power_law_1.2,0.11204479932785034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,2,power_law_1.2,0.10805759429931641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,2,power_law_1.2,0.1160256028175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,2,power_law_1.2,0.11390080451965331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,2,power_law_1.2,0.1512511968612671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,2,power_law_1.2,0.1368127942085266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,2,power_law_1.2,0.15521279573440552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,2,power_law_1.2,0.14820480346679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,2,power_law_1.2,0.19575680494308473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,2,power_law_1.2,0.19633920192718507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,2,power_law_1.2,0.23088641166687013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,2,power_law_1.2,0.24078719615936278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,2,power_law_1.2,0.3230400085449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,2,power_law_1.2,0.3104127883911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,2,power_law_1.2,0.4060800075531006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,2,power_law_1.2,0.3958911895751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,balanced,5.0475358963012695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,2,power_law_1.2,0.589299201965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,2,power_law_1.2,0.6036799907684326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,2,power_law_1.2,0.8049728393554687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,2,power_law_1.2,0.8108863830566406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,2,power_law_1.2,1.212940788269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,2,power_law_1.2,1.3077887535095214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,2,power_law_1.2,1.633977508544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,2,power_law_1.2,1.478553581237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,2,power_law_1.2,2.018783950805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,2,power_law_1.2,1.9638912200927734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,2,power_law_1.2,3.560230255126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,2,power_law_1.2,3.1522560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,balanced,5.5484161376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,2,power_law_1.2,6.674642944335938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,2,power_law_1.2,7.0553535461425785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,balanced,0.07020799815654755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,balanced,0.052015999952952065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,balanced,0.0662773350874583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,balanced,0.06012799839178721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,balanced,0.054229333996772766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,balanced,0.07531733314196269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,balanced,0.049653331438700356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,balanced,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,balanced,0.061093335350354515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,balanced,0.12598933776219687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,balanced,0.08053333560625713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,balanced,0.12644267082214355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,balanced,0.08835732936859131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,balanced,0.12743999560674033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,balanced,0.09032533566157024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,balanced,0.12868266304334006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,balanced,0.09063999851544698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,balanced,0.1281013290087382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,balanced,0.12302933136622111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,balanced,0.09127466877301534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,balanced,0.09165866176287334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,balanced,0.12397332986195882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,balanced,0.09311466415723164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,balanced,0.12447999914487202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,balanced,0.09364799658457439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,balanced,0.1320799986521403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,balanced,0.0953653355439504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,balanced,0.1360266705354055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,balanced,0.13834133744239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,balanced,0.09708266456921895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,balanced,0.1411946713924408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,balanced,0.10261866450309753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,balanced,0.10412800312042236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,balanced,0.1486186683177948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,balanced,0.10938133796056111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,balanced,0.1532799998919169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,balanced,0.11736533045768738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,balanced,0.1758613387743632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,balanced,0.1267039974530538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,balanced,0.17550400892893472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,balanced,0.15213333566983542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,balanced,0.23009065786997476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,balanced,0.16013866662979126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,balanced,0.044922664761543274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,balanced,0.22318933407465616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,balanced,0.21022399266560873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,balanced,0.045610666275024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,balanced,0.06154133379459381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,balanced,0.08142933249473572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,balanced,0.2302666703859965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,balanced,0.32472532987594604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,balanced,0.08354666829109192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,balanced,0.08494933446248372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,balanced,0.0853653351465861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,balanced,0.085807998975118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,balanced,0.3256853421529134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,balanced,0.08684266606966655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,balanced,0.088128000497818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,balanced,0.3635093371073405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,balanced,0.08821866909662883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,balanced,0.09059199690818787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,balanced,0.0909493366877238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,balanced,0.09604266285896301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,balanced,0.38822933038075763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,balanced,0.5129813353220621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,balanced,0.09682133793830872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.01,0.1257599949836731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,balanced,0.5547039906183878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.01,0.1054527997970581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.01,0.07874559760093688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,balanced,0.10257599751154582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.01,0.09377920031547546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,balanced,0.6465813318888346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.01,0.09722880125045777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.01,0.12193280458450317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.01,0.12278399467468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.01,0.12348799705505371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.01,0.11838719844818116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,balanced,0.6939466794331869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.01,0.1189568042755127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.01,0.12396800518035889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.01,0.12916480302810668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,balanced,0.11096533139546712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.01,0.1336192011833191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,balanced,0.1200320025285085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.01,0.14071680307388307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,balanced,0.7517600059509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.01,0.14648959636688233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.01,0.15576959848403932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.01,0.15048320293426515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.01,0.16766079664230346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.01,0.08721920251846313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.01,0.19838720560073853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,balanced,0.8547093073527018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.01,0.24128639698028564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.01,0.08022400140762329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.01,0.2857280015945435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.01,0.06104959845542908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.01,0.3993216037750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,balanced,0.1365066667397817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,2,32,power_law_1.2,0.1259071946144104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.01,0.06775680184364319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.01,0.3931391954421997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.01,0.0803712010383606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,balanced,0.15078933040301004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.01,0.558131217956543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,2,32,power_law_1.2,0.08834559917449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.01,0.08605440258979798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.01,0.6636864185333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,2,32,power_law_1.2,0.06872959733009339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,power_law_1.01,0.07879679799079894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.01,0.08860160112380981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.01,1.095564842224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,balanced,0.19775466124216715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,2,32,power_law_1.2,0.08588799834251404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.01,0.08531839847564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,power_law_1.01,0.07810559868812561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.01,1.5609024047851563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,2,32,power_law_1.2,0.09411839842796325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.01,0.08870400190353393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,power_law_1.01,0.05608320236206055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.01,1.899500846862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.01,0.08869119882583618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,2,32,power_law_1.2,0.11846400499343872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,balanced,0.22728000084559122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,balanced,1.1180480321248372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,power_law_1.01,0.06880000233650208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.01,2.756780815124512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.01,0.08895999789237977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,2,32,power_law_1.2,0.12289279699325562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,power_law_1.01,0.07315840125083924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.01,0.09685760140419006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,2,32,power_law_1.2,0.12066559791564942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.01,6.411968231201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,power_law_1.01,0.08025599718093872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.01,0.09359359741210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,2,32,power_law_1.2,0.12320640087127685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,power_law_1.01,0.08327680230140685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,balanced,0.31627732515335083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.01,0.10386559963226319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,power_law_1.01,0.0864960014820099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,2,32,power_law_1.2,0.1256832003593445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,balanced,1.2712533473968506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.01,0.10517120361328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,power_law_1.01,0.08388479948043823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,2,32,power_law_1.2,0.12653440237045288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.01,0.10983680486679077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,power_law_1.01,0.09171839952468872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,2,32,power_law_1.2,0.13263360261917115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,power_law_1.01,0.09383040070533752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.01,0.11768959760665894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,2,32,power_law_1.2,0.13735040426254272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,balanced,0.4175413449605306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,power_law_1.01,0.09791359901428223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.01,0.13477760553359985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,2,32,power_law_1.2,0.14024959802627562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,power_law_1.01,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.01,0.15852799415588378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,2,32,power_law_1.2,0.14675840139389038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,2,32,power_law_1.2,0.08737279772758484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,power_law_1.01,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.01,0.19271039962768555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,2,32,power_law_1.2,0.16209280490875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.01,0.22133760452270507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,2,32,power_law_1.2,0.16706559658050538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,power_law_1.01,0.12595200538635254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,2,32,power_law_1.2,0.07328640222549439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.01,0.29747838973999025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,2,32,power_law_1.2,0.1934272050857544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,2,32,power_law_1.2,0.06096000075340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,balanced,0.5705066521962484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,2,32,power_law_1.2,0.2520639896392822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.01,0.34151039123535154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,2,32,power_law_1.2,0.07301120162010193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,power_law_1.01,0.1214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,2,32,power_law_1.2,0.2937536001205444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.01,0.46287999153137205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,2,32,power_law_1.2,0.08027520179748535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,2,32,power_law_1.2,0.31877760887145995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.01,0.6305088043212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,2,32,power_law_1.2,0.08831359744071961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,2,32,power_law_1.2,0.4198272228240967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.01,0.8920255661010742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,2,32,power_law_1.2,0.08744320273399353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,power_law_1.01,0.1260800004005432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,2,32,power_law_1.2,0.0889792025089264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,2,32,power_law_1.2,0.4533952236175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.01,1.13504638671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,2,32,power_law_1.2,0.0882752001285553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,2,32,power_law_1.2,0.6511104106903076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,2,32,power_law_1.2,0.09052799940109253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.01,1.5037247657775878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,power_law_1.01,0.14795520305633544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,2,32,power_law_1.2,0.9238335609436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,2,32,power_law_1.2,0.09409919977188111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.01,2.1879552841186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,2,32,power_law_1.2,0.09723520278930664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,power_law_1.01,0.16779520511627197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,2,32,power_law_1.2,1.5328639984130858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,2,32,power_law_1.2,0.10440319776535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,2,32,power_law_1.2,0.10597759485244751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,2,32,power_law_1.2,2.0776512145996096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.01,4.046425628662109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,balanced,0.7421706517537435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,2,32,power_law_1.2,0.11265920400619507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,power_law_1.01,0.20497279167175292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,2,32,power_law_1.2,2.9732608795166016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,2,32,power_law_1.2,0.131660795211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,power_law_1.01,0.25566079616546633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,2,32,power_law_1.2,0.12250880002975464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,balanced,2.301919937133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,2,32,power_law_1.2,3.9574718475341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,2,32,power_law_1.2,0.14535679817199706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,power_law_1.01,0.34443519115447996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,2,32,power_law_1.2,0.1758015990257263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,power_law_1.01,0.43527679443359374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,2,32,power_law_1.2,0.2295232057571411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,2,32,power_law_1.2,10.317721557617187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,2,32,power_law_1.2,0.2779200077056885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,power_law_1.01,0.6569024085998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,2,32,power_law_1.2,0.33778560161590576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,power_law_1.01,0.8427071571350098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,2,32,power_law_1.2,0.4402624130249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,balanced,2.483018716176351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,2,32,power_law_1.2,0.5724736213684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,power_law_1.01,1.2010432243347169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,2,32,power_law_1.2,0.7753791809082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,2,32,power_law_1.2,1.0895039558410644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,power_law_1.01,1.8145727157592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,2,32,power_law_1.2,1.5012160301208497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,balanced,0.8998613357543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,2,32,power_law_1.2,2.2176319122314454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,power_law_1.01,2.0883199691772463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,2,32,power_law_1.2,4.292153549194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,power_law_1.01,3.6981311798095704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,2,32,power_law_1.2,6.721190643310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,power_law_1.01,6.34911994934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,balanced,1.4223893483479817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,balanced,2.8383092880249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,2,32,power_law_1.2,0.07901440262794494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,2,32,power_law_1.2,0.057126402854919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,2,32,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,2,32,power_law_1.2,0.06346880197525025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,2,32,power_law_1.2,0.0704576015472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,2,32,power_law_1.2,0.08001279830932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,2,32,power_law_1.2,0.08017920255661011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,2,32,power_law_1.2,0.08759040236473084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,2,32,power_law_1.2,0.0871616005897522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,2,32,power_law_1.2,0.09095039963722229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,2,32,power_law_1.2,0.09509119987487794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,2,32,power_law_1.2,0.09812480211257935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,2,32,power_law_1.2,0.10202879905700683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,2,32,power_law_1.2,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,2,32,power_law_1.2,0.13156479597091675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,2,32,power_law_1.2,0.12949119806289672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,2,32,power_law_1.2,0.13787519931793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,2,32,power_law_1.2,0.16720000505447388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,balanced,0.052522664268811546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,2,32,power_law_1.2,0.19671679735183717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,balanced,0.054655998945236206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,balanced,0.04897066454092661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,balanced,0.05947199960549673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,balanced,0.0751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,2,32,power_law_1.2,0.2342911958694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,balanced,0.10870933532714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,balanced,0.04831466575463613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,balanced,0.12576533357302347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,2,32,power_law_1.2,0.2894464015960693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,balanced,0.053770666321118675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,balanced,0.12678933143615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,2,32,power_law_1.2,0.49236478805541994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,balanced,0.05782933533191681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,balanced,0.12779200077056885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.01,0.1109887957572937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,2,32,power_law_1.2,0.5725567817687989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,balanced,0.07922133306662242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,balanced,0.1288159986337026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.01,0.11259520053863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.01,0.07432960271835327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,2,32,power_law_1.2,0.8692607879638672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,balanced,0.08760533730189006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,balanced,0.12845333417256674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.01,0.06670719981193543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,balanced,0.043050666650136314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.01,0.08424320220947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,2,32,power_law_1.2,1.0509247779846191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,balanced,0.12376532951990764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,balanced,0.09038933118184407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.01,0.08638079762458802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,balanced,0.12502933541933695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.01,0.05694079995155334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,balanced,0.09126399954160054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,2,32,power_law_1.2,2.0894144058227537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.01,0.09041919708251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,balanced,0.125082661708196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,balanced,0.09193600217501323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,balanced,0.0452159990866979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.01,0.0665727972984314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,balanced,0.13353066643079123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.01,0.1115839958190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,balanced,0.05656533439954122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,balanced,0.09238400061925252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.01,0.07111039757728577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,2,32,power_law_1.2,2.3656511306762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,balanced,0.13713600238164267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,balanced,0.08106133341789246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,balanced,0.09447466333707173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.01,0.11474560499191284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.01,0.08359040021896362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,balanced,0.08346133430798848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,balanced,0.14486400286356607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,balanced,0.0936906635761261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.01,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.01,0.08535040020942689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,balanced,0.08524266878763835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,2,32,power_law_1.2,3.926310348510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,balanced,0.14230933785438538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,balanced,0.09620799620946248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.01,0.1235967993736267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.01,0.08650239706039428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,balanced,0.08581866820653279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,balanced,0.0974133312702179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,balanced,0.15396266182263693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,balanced,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.01,0.08476160168647766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.01,0.12238080501556396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,2,32,power_law_1.2,5.710412979125977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,balanced,0.10356266299883525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,balanced,0.08735466996828715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.01,0.08951680064201355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,balanced,0.1602026621500651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.01,0.1232640027999878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,power_law_1.01,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,balanced,0.10730133454004924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,balanced,0.0888266662756602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.01,0.09102720022201538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,2,32,power_law_1.2,11.68155517578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.01,0.13043839931488038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,balanced,0.10981866717338562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,balanced,0.18992533286412558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,balanced,0.08953600128491719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,power_law_1.01,0.06793599724769592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.01,0.08974080085754395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.01,0.12807680368423463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,balanced,0.1263146698474884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,balanced,0.09191466371218364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,power_law_1.01,0.05046399831771851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.01,0.09679999947547913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,balanced,0.18798933426539102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.01,0.14069119691848755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,balanced,0.09317866961161296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,balanced,0.13251200318336487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,power_law_1.01,0.06220800280570984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.01,0.09921280145645142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.01,0.14639359712600708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,balanced,0.0995093286037445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,power_law_1.01,0.06865919828414917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,balanced,0.1614720026652018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.01,0.1159168004989624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,balanced,0.2352480093638102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.01,0.15734399557113649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,power_law_1.01,0.07917439937591553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.01,0.12280319929122925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.01,0.16044800281524657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,balanced,0.17221866051355997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,power_law_1.01,0.08346239924430847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.01,0.12152320146560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,balanced,0.244869331518809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.01,0.18529280424118041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,power_law_1.01,0.08593279719352723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,balanced,0.10055999954541524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.01,0.15249919891357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,balanced,0.23332266012827554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.01,0.19584640264511108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,power_law_1.01,0.08492159843444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.01,0.15340800285339357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.01,0.23748478889465333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,power_law_1.01,0.08988159894943237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.01,0.19130239486694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,balanced,0.3717973232269287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,balanced,0.25261332591374713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,power_law_1.01,0.08951680064201355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.01,0.24021759033203124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.01,0.21445760726928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,balanced,0.10833066701889038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,power_law_1.01,0.10043519735336304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.01,0.3079807996749878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.01,0.29706239700317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.01,0.33590400218963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,power_law_1.01,0.10202239751815796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.01,0.35790081024169923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.01,0.487827205657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,power_law_1.01,0.10581760406494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,balanced,0.36186667283376056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,balanced,0.41550934314727783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.01,0.49506559371948244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,power_law_1.01,0.11815680265426635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.01,0.6785024166107178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.01,0.6992703914642334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.01,0.9269632339477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.01,0.9380352020263671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,balanced,0.12052266796429952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.01,1.1453951835632323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,power_law_1.01,0.11887359619140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,balanced,0.4355253378550212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.01,1.2908543586730956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,balanced,0.13147200147310892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.01,1.5552000045776366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.01,1.7320640563964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,balanced,0.5800853172938029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.01,2.2368383407592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,power_law_1.01,0.12435840368270874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.01,2.711257553100586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.01,4.583513641357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.01,4.463801574707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,power_law_1.01,0.14743679761886597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,balanced,0.6410346825917562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,balanced,0.1532639960447947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,power_law_1.01,0.17297919988632202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,16,power_law_1.2,0.09894400238990783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,16,power_law_1.2,0.07969279885292054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,balanced,0.17287999391555786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,16,power_law_1.2,0.07032960057258605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,balanced,0.6899999777475992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,power_law_1.01,0.21444480419158934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,16,power_law_1.2,0.07803519964218139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,power_law_1.01,0.268723201751709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,balanced,0.2358293334643046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,16,power_law_1.2,0.0936191976070404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,power_law_1.01,0.40435199737548827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,16,power_law_1.2,0.12212480306625366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,16,power_law_1.2,0.11300480365753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,power_law_1.01,0.5041344165802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,balanced,0.2902666727701823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,balanced,0.7599413394927979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,16,power_law_1.2,0.11609599590301514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,power_law_1.01,0.711737585067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,16,power_law_1.2,0.1223423957824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,16,power_law_1.2,0.12261120080947877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,power_law_1.01,0.8341504096984863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,16,power_law_1.2,0.12677760124206544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,balanced,0.41473599274953205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,power_law_1.01,1.3162303924560548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,16,power_law_1.2,0.12749439477920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,balanced,0.8494613170623779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,16,power_law_1.2,0.1287616014480591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,16,power_law_1.2,0.14357119798660278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,16,power_law_1.2,0.16058239936828614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,16,power_law_1.2,0.17256319522857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,power_law_1.01,1.9265792846679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,16,power_law_1.2,0.1606335997581482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,balanced,0.5387413501739502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,16,power_law_1.2,0.18800640106201172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,power_law_1.01,2.454694366455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,balanced,0.9391520023345947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,16,power_law_1.2,0.2024319887161255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,16,power_law_1.2,0.26988160610198975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,power_law_1.01,3.2029182434082033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,16,power_law_1.2,0.2977216005325317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,16,power_law_1.2,0.35086081027984617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,power_law_1.01,6.756134033203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,16,power_law_1.2,0.4751039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,balanced,0.7343733310699463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,16,power_law_1.2,0.5910143852233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,16,power_law_1.2,0.7578879833221436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,16,power_law_1.2,1.1536640167236327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,16,power_law_1.2,1.5381695747375488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,balanced,1.2295680046081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,16,power_law_1.2,1.9651840209960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,16,power_law_1.2,3.754457473754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,power_law_1.2,6.782982635498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,balanced,0.9688426653544108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,balanced,1.425989309946696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,balanced,1.182576020558675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,16,power_law_1.2,0.08120959997177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,16,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,16,power_law_1.2,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,16,balanced,2.3956693013509116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,balanced,1.8560907046000164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,16,power_law_1.2,0.06334720253944397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,16,power_law_1.2,0.07101439833641052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,16,power_law_1.2,0.08334720134735107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,16,power_law_1.2,0.08290560245513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,16,power_law_1.2,0.08565120100975036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,16,power_law_1.2,0.08979840278625488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,16,power_law_1.2,0.08796160221099854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,balanced,2.8821493784586587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,16,power_law_1.2,0.09219200015068055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,16,power_law_1.2,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,16,power_law_1.2,0.09770879745483399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,16,power_law_1.2,0.10943360328674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,16,power_law_1.2,0.11481599807739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,16,power_law_1.2,0.12482559680938721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,16,power_law_1.2,0.12737280130386353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,16,power_law_1.2,0.151910400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,16,power_law_1.2,0.15323519706726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,16,power_law_1.2,0.21903998851776124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,16,power_law_1.2,0.2417855978012085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,16,power_law_1.2,0.31675519943237307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,16,power_law_1.2,0.38329598903656004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,16,power_law_1.2,0.5532864093780517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,16,power_law_1.2,0.6989696025848389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,balanced,0.05366399884223938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,16,power_law_1.2,1.1315072059631348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,balanced,0.053770666321118675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,16,power_law_1.2,1.4732799530029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,balanced,0.05962666869163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,16,power_law_1.2,1.6731136322021485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,balanced,0.07584000130494435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,16,power_law_1.2,0.07961599826812744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,balanced,0.1090133289496104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,16,power_law_1.2,2.8081727981567384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,16,power_law_1.2,0.05319039821624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,balanced,3.6975412368774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,balanced,0.12899200121561685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,16,power_law_1.2,0.05135999917984009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,balanced,0.13060800234476724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,16,power_law_1.2,6.440735626220703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,16,power_law_1.2,0.06101120114326477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,balanced,0.1240000029404958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,16,power_law_1.2,0.06540160179138184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,balanced,0.12353600064913432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,16,power_law_1.2,0.07898240089416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,balanced,0.1255626678466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,16,power_law_1.2,0.08365439772605895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,balanced,0.12569066882133484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,16,power_law_1.2,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,balanced,0.1283466617266337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,16,power_law_1.2,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,balanced,0.1295093297958374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,16,power_law_1.2,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,balanced,0.139765332142512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,16,power_law_1.2,0.09431040287017822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,balanced,0.14410133163134256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,16,power_law_1.2,0.09915519952774048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,balanced,0.14706666270891824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,16,power_law_1.2,0.10229120254516602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,balanced,0.149125337600708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,16,power_law_1.2,0.10931839942932128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,balanced,0.16976000865300497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,16,power_law_1.2,0.12275199890136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,balanced,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,balanced,0.17308266957600912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,balanced,0.049125333627065025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,balanced,0.22010666131973267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,balanced,0.050928001602490745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,16,power_law_1.2,0.12629120349884032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,balanced,0.058677335580190025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,balanced,0.2165493369102478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,balanced,0.08103999992211659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,balanced,0.08963200449943542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,16,power_law_1.2,0.13722239732742308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,balanced,0.28969599803288776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,balanced,0.09240000446637471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,balanced,0.09310932954152425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,balanced,0.09407466650009155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,16,power_law_1.2,0.15036159753799438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,balanced,0.304202675819397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,balanced,0.09622933467229207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,16,power_law_1.2,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,balanced,0.09700799981753032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,balanced,0.09700266520182292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,balanced,0.4409173329671224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,16,power_law_1.2,0.26810879707336427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,balanced,0.09993599851926167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,16,power_law_1.2,0.3477952003479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,balanced,0.10084799925486247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,balanced,0.04409599800904592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,16,power_law_1.2,0.4817920207977295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,balanced,0.10869866609573364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,balanced,0.11176000038782756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,balanced,0.04572266836961111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,16,power_law_1.2,0.5972864151000976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,balanced,0.504965345064799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,balanced,0.11777599652608235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,balanced,0.048453330993652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,16,power_law_1.2,0.9684096336364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,balanced,0.059845333298047386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,balanced,0.13970667123794556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,16,power_law_1.2,1.3387392044067383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,balanced,0.08284799754619598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,balanced,0.14573333660761514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,16,power_law_1.2,1.740287971496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,balanced,0.08924266695976257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,balanced,0.18860799074172974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,balanced,0.09130133191744487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,balanced,0.7363359928131104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,16,power_law_1.2,2.213612747192383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,balanced,0.09128533800443013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,balanced,0.19380799929300943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,balanced,0.09277333815892537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,16,power_law_1.2,2.708415985107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,balanced,0.09333866834640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,balanced,0.2646453380584717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,16,power_law_1.2,4.395110321044922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,balanced,0.09565866986910503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,balanced,0.0969546635945638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,balanced,0.10096533099810283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,16,power_law_1.2,12.250572967529298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,balanced,0.3020906647046407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,balanced,0.10289600491523743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,balanced,0.9789493083953857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,balanced,0.11105066537857056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.01,0.07789440155029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,balanced,0.44652267297108966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.01,0.0967423975467682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.01,0.06301440000534057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,balanced,0.11331199606259663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.01,0.07724800109863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.01,0.08967679738998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,balanced,0.542303999265035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.01,0.11126400232315063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.01,0.11468160152435303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,balanced,0.12422399719556172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.01,0.06105599999427795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,balanced,1.0679999987284343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.01,0.11323519945144653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.01,0.06346240043640136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.01,0.1161728024482727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.01,0.05292159914970398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.01,0.11898880004882813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.01,0.062457597255706786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.01,0.12416000366210937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,balanced,0.7751999696095785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.01,0.0709824025630951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.01,0.13008639812469483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.01,0.0812608003616333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.01,0.1370303988456726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,balanced,0.14307733376820883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.01,0.08510720133781433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.01,0.1312064051628113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.01,0.0873856008052826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.01,0.14440959692001343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,balanced,0.15754666924476624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.01,0.0875328004360199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.01,0.15807360410690308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.01,0.09038720130920411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.01,0.16678400039672853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.01,0.09356160163879394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.01,0.1906048059463501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.01,0.09917439818382263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.01,0.20258560180664062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.01,0.10544639825820923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.01,0.2638144016265869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,balanced,0.9832800229390463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.01,0.10393600463867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.01,0.27425920963287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.01,0.11308799982070923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,balanced,0.1966773271560669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.01,0.3236991882324219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.01,0.12126719951629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.01,0.13333120346069335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.01,0.39407360553741455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,balanced,1.7330773671468098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.01,0.1497663974761963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.01,0.5885759830474854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.01,0.16711679697036744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.01,0.7575808048248291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.01,0.21063039302825928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,balanced,0.34913067022959393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.01,0.9956671714782714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.01,0.23367679119110107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.01,1.2955583572387694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.01,0.3042304039001465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.01,1.82043514251709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,balanced,0.4234400192896525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.01,0.3910144090652466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.01,2.576211166381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.01,0.5668799877166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,balanced,1.1723999977111816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.01,0.7014912128448486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.01,4.879616165161133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,8,power_law_1.2,0.07774080038070678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.01,0.9830143928527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,balanced,0.5996053218841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,8,power_law_1.2,0.06287999749183655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.01,1.2969280242919923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,8,power_law_1.2,0.06530560255050659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.01,1.525823974609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,power_law_1.01,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,8,power_law_1.2,0.07578880190849305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.01,2.400070381164551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,8,power_law_1.2,0.08353919982910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,power_law_1.01,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,balanced,0.7817280292510986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,power_law_1.01,0.053311997652053834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,8,power_law_1.2,0.11509120464324951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.01,5.132614517211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,power_law_1.01,0.061766397953033444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,8,power_law_1.2,0.1146880030632019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,power_law_1.01,0.06986240148544312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,8,power_law_1.2,0.11800960302352906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,power_law_1.01,0.08131840229034423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,8,power_law_1.2,0.12268799543380737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,power_law_1.01,0.08574720025062561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,8,power_law_1.2,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,power_law_1.01,0.08614400029182434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,balanced,1.097983996073405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,8,power_law_1.2,0.1382143974304199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,8,power_law_1.2,0.13266559839248657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,power_law_1.01,0.09051520228385926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,balanced,1.8489759763081868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,8,power_law_1.2,0.14417920112609864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,power_law_1.01,0.0921343982219696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,8,power_law_1.2,0.14562560319900514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,8,power_law_1.2,0.14588160514831544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,power_law_1.01,0.0939520001411438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,8,power_law_1.2,0.1529855966567993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,power_law_1.01,0.10875519514083862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,8,power_law_1.2,0.17316479682922364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,power_law_1.01,0.10958720445632934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,8,power_law_1.2,0.19485440254211425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,8,power_law_1.2,0.20670719146728517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,power_law_1.01,0.11523840427398682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,balanced,1.4594507217407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,8,power_law_1.2,0.27871360778808596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,power_law_1.01,0.1272320032119751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,balanced,3.1847572326660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,8,power_law_1.2,0.2827071905136108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,8,power_law_1.2,0.39565439224243165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,power_law_1.01,0.13481600284576417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,8,power_law_1.2,0.45852160453796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,8,power_law_1.2,0.6436607837677002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,power_law_1.01,0.1451840043067932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,8,power_law_1.2,0.9184191703796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,8,power_law_1.2,1.1852416038513183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,power_law_1.01,0.1703935980796814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,8,power_law_1.2,1.843142318725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,power_law_1.01,0.20110719203948973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,balanced,1.787610689798991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,8,power_law_1.2,2.214124870300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,power_law_1.01,0.26175999641418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,8,power_law_1.2,3.460550308227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,power_law_1.01,0.3101759910583496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,power_law_1.01,0.4511807918548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,power_law_1.01,0.6546751976013183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,8,power_law_1.2,6.486073303222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,power_law_1.01,0.9654975891113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,power_law_1.01,1.1097344398498534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,power_law_1.01,1.7102399826049806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,power_law_1.01,2.0938688278198243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,power_law_1.01,2.550860786437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,power_law_1.01,4.696979141235351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,balanced,3.612144152323405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,power_law_1.01,8.747821044921874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,balanced,2.8124586741129556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,8,power_law_1.2,0.06097279787063599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,8,power_law_1.2,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,8,power_law_1.2,0.052236801385879515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,8,power_law_1.2,0.06344959735870362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,8,power_law_1.2,0.0675711989402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,8,power_law_1.2,0.08031359910964966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,8,power_law_1.2,0.08503040075302123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,8,power_law_1.2,0.08791679739952088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,8,power_law_1.2,0.09119359850883484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,8,power_law_1.2,0.0934656023979187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,8,power_law_1.2,0.09684479832649232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,8,power_law_1.2,0.10122879743576049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,8,power_law_1.2,0.1035264015197754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,8,power_law_1.2,0.10603519678115844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,8,power_law_1.2,0.11459840536117553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,8,power_law_1.2,0.12142720222473144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,8,power_law_1.2,0.13714560270309448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,8,power_law_1.2,0.16301440000534057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,8,power_law_1.2,0.16657919883728028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,8,power_law_1.2,0.21512320041656494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,8,power_law_1.2,0.24672000408172606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,8,power_law_1.2,0.3354624032974243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,balanced,5.594693501790364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,8,power_law_1.2,0.4531775951385498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,8,power_law_1.2,0.5995391845703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,8,power_law_1.2,0.769324779510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,8,power_law_1.2,1.466163158416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,8,power_law_1.2,1.5206463813781739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,8,power_law_1.2,1.880473518371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,8,power_law_1.2,2.772204780578613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,8,power_law_1.2,6.042323303222656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,8,power_law_1.2,0.06405760049819946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,8,power_law_1.2,0.052313601970672606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,8,power_law_1.2,0.05066239833831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,balanced,0.05271466573079427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,8,power_law_1.2,0.061337602138519284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,balanced,0.06010666489601135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,8,power_law_1.2,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,balanced,0.06366399923960368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,8,power_law_1.2,0.08270080089569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,balanced,0.08346133430798848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,8,power_law_1.2,0.0855679988861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,balanced,0.1167093316713969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,8,power_law_1.2,0.08997120261192322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,balanced,0.14513066411018372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,balanced,0.047226667404174805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,balanced,0.14755733807881674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,8,power_law_1.2,0.09351680278778077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,balanced,0.05009600023428599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,balanced,0.13499733805656433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,8,power_law_1.2,0.09508479833602905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,balanced,0.05212800204753876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,balanced,0.13526933391888937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,balanced,0.06544533371925354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,8,power_law_1.2,0.10047999620437623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,balanced,0.13660266995429993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,balanced,0.09102400143941243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,balanced,0.13831466436386108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,8,power_law_1.2,0.10428160429000854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,balanced,0.10353599985440572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,balanced,0.14044800400733948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,balanced,0.10751466949780782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,8,power_law_1.2,0.1146880030632019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,balanced,0.14243732889493307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,balanced,0.10249599814414978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,balanced,0.10437867045402527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,8,power_law_1.2,0.12080639600753784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,balanced,0.14819733301798502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,balanced,0.10604799787203471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,8,power_law_1.2,0.1354688048362732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,balanced,0.1067626674969991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,balanced,0.15652267138163248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,balanced,0.10937066872914632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,balanced,0.11020800471305847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,balanced,0.16030399998029074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,balanced,0.11539733409881592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,8,power_law_1.2,0.13960959911346435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,balanced,0.12286933263142903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,balanced,0.16740266482035318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,balanced,0.1253653367360433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,balanced,0.13450666268666586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,balanced,0.2017866571744283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,balanced,0.17064533631006876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,8,power_law_1.2,0.14823039770126342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,balanced,0.17207467555999756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,balanced,0.1988746722539266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,balanced,0.2063200076421102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,8,power_law_1.2,0.18005759716033937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,balanced,0.2648319999376933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,balanced,0.23524266481399536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,8,power_law_1.2,0.21120638847351075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,balanced,0.26770132780075073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,balanced,0.3374240001042684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,8,power_law_1.2,0.30619521141052247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,balanced,0.3855626583099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,8,power_law_1.2,0.35952000617980956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,balanced,0.05075199902057648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,balanced,0.40325868129730225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,8,power_law_1.2,0.5608255863189697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,balanced,0.053632001082102455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,balanced,0.408405343691508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,8,power_law_1.2,0.6136064052581787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,balanced,0.056405335664749146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,balanced,0.0749120016892751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,balanced,0.5958666801452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,8,power_law_1.2,1.061740779876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.01,0.06384639739990235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,balanced,0.09598400195439656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.01,0.06106879711151123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,8,power_law_1.2,1.394559955596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.01,0.0719488024711609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,balanced,0.10169600447018941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,balanced,0.6255573431650797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.01,0.05281280279159546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.01,0.06256639957427979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,balanced,0.10477866729100545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,8,power_law_1.2,1.9562559127807617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,balanced,0.10604799787203471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,balanced,0.7500747044881185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.01,0.0649407982826233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.01,0.07712640166282654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,8,power_law_1.2,2.8372800827026365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,balanced,0.10752532879511516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.01,0.07296000123023987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.01,0.08937600255012512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,balanced,0.10897066195805867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,8,power_law_1.2,3.6197566986083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,balanced,0.7414240042368571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.01,0.09015039801597595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.01,0.1134335994720459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,balanced,0.11212799946467082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.01,0.0998528003692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,balanced,0.11565333604812622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.01,0.1320255994796753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,8,power_law_1.2,6.016678237915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.01,0.09413759708404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,balanced,0.12017599741617839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.01,0.12743040323257446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,balanced,1.1024106343587239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.01,0.0971455991268158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,balanced,0.12627200285593668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.01,0.12681599855422973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,8,power_law_1.2,11.777970886230468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.01,0.10010240077972413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,balanced,0.13555733362833658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.01,0.12963839769363403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.01,0.10376960039138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,balanced,1.0964000225067139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.01,0.13446400165557862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.01,0.10887680053710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.01,0.13841279745101928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.01,0.11318399906158447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,balanced,0.1462399959564209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.01,0.14296319484710693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.01,0.12424319982528687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.01,0.15103360414505004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.01,0.13288320302963258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,balanced,1.3691306114196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.01,0.13921279907226564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.01,0.16930559873580933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.01,0.1486080050468445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.01,0.17662080526351928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,balanced,0.15940800309181213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,balanced,1.344362735748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.01,0.17656960487365722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.01,0.19832320213317872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.01,0.18844159841537475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.01,0.21738240718841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.01,0.23319680690765382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.01,0.23391358852386473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.01,0.27325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.01,0.2881472110748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.01,0.339136004447937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.01,0.36477439403533934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,balanced,0.19901333252588907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,balanced,1.6385812759399414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.01,0.4053311824798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.01,0.4865600109100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,balanced,0.23958933353424072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.01,0.5455359935760498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.01,0.645030403137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,balanced,0.3168639938036601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.01,0.7248447895050049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.01,0.8217280387878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,balanced,1.5877173741658528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.01,0.8851584434509278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,balanced,0.38576531410217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.01,1.2380160331726073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.01,1.3728832244873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.01,1.62609920501709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,balanced,0.5579093297322592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.01,1.7022207260131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.01,1.879654312133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,power_law_1.01,0.0574720025062561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.01,2.097657585144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.01,2.9597631454467774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,power_law_1.01,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,balanced,0.6916053295135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,power_law_1.01,0.0602944016456604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.01,3.3220863342285156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,power_law_1.01,0.07067520022392274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.01,6.542822265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,power_law_1.01,0.07739520072937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,4,power_law_1.2,0.06399359703063964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,power_law_1.01,0.0932096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.01,7.357241821289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,balanced,0.9845759868621826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,power_law_1.01,0.09642879962921143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,4,power_law_1.2,0.06546559929847717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,balanced,2.6144800186157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,power_law_1.01,0.10092159509658813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,4,power_law_1.2,0.06216959953308106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,power_law_1.01,0.10276479721069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,power_law_1.01,0.10909440517425537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,4,power_law_1.2,0.07689599990844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,power_law_1.01,0.11454720497131347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,4,power_law_1.2,0.08241919875144958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,power_law_1.01,0.12629120349884032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,balanced,1.2868320147196453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,4,power_law_1.2,0.11507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,power_law_1.01,0.1336127996444702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,balanced,2.532421271006266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,power_law_1.01,0.1469823956489563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,4,power_law_1.2,0.1226304054260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,power_law_1.01,0.1597440004348755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,4,power_law_1.2,0.12711039781570435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,4,power_law_1.2,0.12558720111846924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,power_law_1.01,0.16701439619064332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,4,power_law_1.2,0.12681599855422973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,balanced,1.8519253730773926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,4,power_law_1.2,0.13861759901046752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,4,power_law_1.2,0.14538240432739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,power_law_1.01,0.18268799781799316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,4,power_law_1.2,0.16090240478515624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,4,power_law_1.2,0.1657088041305542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,4,power_law_1.2,0.17299840450286866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,power_law_1.01,0.2323904037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,power_law_1.01,0.28920319080352785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,4,power_law_1.2,0.18302719593048095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,power_law_1.01,0.3893696069717407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,4,power_law_1.2,0.19645440578460693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,power_law_1.01,0.4802879810333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,balanced,2.4523466428120932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,4,power_law_1.2,0.21735680103302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,power_law_1.01,0.6787007808685303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,4,power_law_1.2,0.2421247959136963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,power_law_1.01,0.8243200302124023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,4,power_law_1.2,0.28984320163726807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,power_law_1.01,1.2242367744445801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,power_law_1.01,1.6375040054321288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,4,power_law_1.2,0.33720319271087645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,power_law_1.01,2.192127990722656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,4,power_law_1.2,0.4599616050720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,power_law_1.01,3.0952320098876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,4,power_law_1.2,0.6487743854522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,power_law_1.01,4.085830307006836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,4,power_law_1.2,0.7630591869354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,4,power_law_1.2,1.013587188720703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,balanced,5.193338712056478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,power_law_1.01,6.093664169311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,balanced,3.005807876586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,4,power_law_1.2,1.4621888160705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,4,power_law_1.2,2.0300928115844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,power_law_1.01,11.123283386230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,4,power_law_1.2,2.2852031707763674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,4,power_law_1.2,3.917567825317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,balanced,4.942111968994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,4,power_law_1.2,7.431526184082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,balanced,4.777562777201335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,4,power_law_1.2,0.05235840082168579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,4,power_law_1.2,0.0529151976108551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,4,power_law_1.2,0.05437440276145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,4,power_law_1.2,0.06198400259017944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,4,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,4,power_law_1.2,0.08579199910163879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,4,power_law_1.2,0.09273599982261657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,4,power_law_1.2,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,4,power_law_1.2,0.09635199904441834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,4,power_law_1.2,0.10392320156097412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,4,power_law_1.2,0.10735360383987427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,4,power_law_1.2,0.11113599538803101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,4,power_law_1.2,0.11783039569854736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,4,power_law_1.2,0.12632319927215577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,4,power_law_1.2,0.1335487961769104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,balanced,9.467274983723959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,4,power_law_1.2,0.14190080165863037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,4,power_law_1.2,0.1556607961654663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,4,power_law_1.2,0.18471039533615113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,4,power_law_1.2,0.19734400510787964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,4,power_law_1.2,0.254367995262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,4,power_law_1.2,0.2949183940887451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,4,power_law_1.2,0.40271358489990233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,balanced,0.05345066885153452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,4,power_law_1.2,0.49061760902404783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,4,power_law_1.2,0.6987840175628662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,balanced,0.05845866600672404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,balanced,0.06898133456707001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,4,power_law_1.2,0.9750399589538574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,balanced,0.09134399890899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,4,power_law_1.2,0.05804160237312317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,balanced,0.12637333075205484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,4,power_law_1.2,1.4692543983459472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,balanced,0.15756266315778097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,4,power_law_1.2,0.05880320072174072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,balanced,0.16077867150306702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,4,power_law_1.2,1.7090560913085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,balanced,0.15029333035151163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,4,power_law_1.2,0.060089600086212155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,balanced,0.15026133259137472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,4,power_law_1.2,2.3949247360229493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,4,power_law_1.2,0.06802560091018676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,balanced,0.1535253326098124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,4,power_law_1.2,0.07394559979438782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,4,power_law_1.2,3.848332977294922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,balanced,0.1567306617895762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,4,power_law_1.2,0.09416959881782531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,balanced,0.15879467129707336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,4,power_law_1.2,0.09786239862442017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,balanced,0.16223999857902527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,4,power_law_1.2,7.657612609863281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,4,power_law_1.2,0.10271999835968018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,balanced,0.16931732495625815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,4,power_law_1.2,0.1074560046195984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,balanced,0.17857599258422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,balanced,0.18582399686177573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,4,power_law_1.2,0.11249279975891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,balanced,0.190175990263621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,4,power_law_1.2,0.12253439426422119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,balanced,0.2670133312543233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,4,power_law_1.2,0.12707200050354003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,balanced,0.2553866704305013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,4,power_law_1.2,0.13563519716262817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,balanced,0.3227199912071228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,4,power_law_1.2,0.15107840299606323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,4,power_law_1.2,0.16563199758529662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,balanced,0.3550399939219157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,balanced,0.5706559816996256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,4,power_law_1.2,0.17937920093536378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,balanced,0.651855985323588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,4,power_law_1.2,0.19178880453109742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,balanced,0.9604159990946451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,4,power_law_1.2,0.23860480785369872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,4,power_law_1.2,0.30371201038360596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,4,power_law_1.2,0.39412479400634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,4,power_law_1.2,0.4728896141052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,balanced,0.049733335773150124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,balanced,1.2200693289438884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,4,power_law_1.2,0.7328832149505615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,balanced,0.05250666538874308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,4,power_law_1.2,0.9176063537597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,balanced,0.05671466886997223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,4,power_law_1.2,1.2847040176391602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,balanced,0.07398933172225952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,balanced,0.10507733623186748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,4,power_law_1.2,1.7768640518188477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.01,0.0686847984790802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,balanced,0.1228000024954478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,4,power_law_1.2,2.578265571594238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.01,0.05082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.01,0.060147202014923094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,balanced,0.12462400396664937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,balanced,1.8415679931640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,4,power_law_1.2,3.467647933959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,balanced,0.1260373294353485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.01,0.06672639846801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,balanced,0.12787200013796488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.01,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.01,0.0795199990272522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,4,power_law_1.2,4.396294403076172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,balanced,0.12988266348838806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.01,0.07026559710502625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.01,0.09494400024414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,balanced,0.1325226624806722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,4,power_law_1.2,7.859897613525391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.01,0.07754240036010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.01,0.1214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,balanced,0.134661336739858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.01,0.10104960203170776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.01,0.13351039886474608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,balanced,0.13938132921854654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.01,0.11129599809646606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.01,0.13805439472198486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,4,power_law_1.2,18.477317810058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,balanced,2.1333972613016763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,balanced,0.1441973348458608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.01,0.11358079910278321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.01,0.13906559944152833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,balanced,0.1527466674645742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.01,0.11851520538330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.01,0.14522240161895753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,balanced,0.17061332861582437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.01,0.1225600004196167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.01,0.15627520084381102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,balanced,0.17320533593495688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.01,0.12976640462875366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.01,0.16168960332870483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,balanced,0.2521653374036153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.01,0.13688960075378417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.01,0.16856319904327394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.01,0.14494719505310058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,balanced,0.22363734245300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.01,0.16666239500045776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.01,0.14905600547790526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.01,0.18520959615707397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,balanced,0.28410667181015015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.01,0.19716479778289794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.01,0.17182079553604127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,balanced,2.603391965230306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,balanced,0.31777065992355347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.01,0.20809600353240967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.01,0.1847551941871643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.01,0.19188480377197265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.01,0.26975359916687014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.01,0.24821760654449462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,balanced,0.4993120034535726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.01,0.28078720569610593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.01,0.24085121154785155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.01,0.3507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.01,0.30840320587158204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.01,0.4136832237243652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,balanced,0.6249013344446818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.01,0.36941440105438234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.01,0.5462080001831054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.01,0.4829247951507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.01,0.6794496059417725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.01,0.6282623767852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,balanced,0.9253599643707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.01,0.9723456382751465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.01,0.9214015960693359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.01,1.2363967895507812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.01,1.274009609222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.01,1.8799936294555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.01,2.1587711334228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.01,1.7721216201782226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,balanced,4.183808008829753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,balanced,1.1934080123901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.01,2.869651222229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.01,2.423411178588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.01,4.702188873291016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.01,2.880633544921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.01,4.63963508605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.01,10.028288269042969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,balanced,1.808303991953532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.01,9.677523040771485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,balanced,2.1266719500223794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,2,power_law_1.2,0.06852480173110961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,balanced,2.6209227244059243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,2,power_law_1.2,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,2,power_law_1.2,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,2,power_law_1.2,0.07781760096549988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,2,power_law_1.2,0.0890175998210907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,balanced,8.606335957845053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,2,power_law_1.2,0.12293119430541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,2,power_law_1.2,0.13070720434188843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,2,power_law_1.2,0.13623039722442626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,2,power_law_1.2,0.14205440282821655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,2,power_law_1.2,0.1465407967567444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,2,power_law_1.2,0.1582527995109558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,2,power_law_1.2,0.16323839426040648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,2,power_law_1.2,0.17233920097351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,2,power_law_1.2,0.1739135980606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,2,power_law_1.2,0.18995840549468995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,2,power_law_1.2,0.19779200553894044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,balanced,4.267482757568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,2,power_law_1.2,0.20955519676208495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,2,power_law_1.2,0.27349119186401366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,2,power_law_1.2,0.2871488094329834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,2,power_law_1.2,0.35847039222717286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,2,power_law_1.2,0.4273856163024902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,2,power_law_1.2,0.5842304229736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,2,power_law_1.2,0.7552832126617431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,2,power_law_1.2,1.0232640266418458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,2,power_law_1.2,1.3940287590026856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,2,power_law_1.2,2.1358335494995115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,2,power_law_1.2,2.424211120605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,2,power_law_1.2,3.0372287750244142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,2,power_law_1.2,0.0510591983795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,2,power_law_1.2,4.941804885864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,2,power_law_1.2,0.05246719717979431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,2,power_law_1.2,0.05586559772491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,2,power_law_1.2,0.06675840020179749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,2,power_law_1.2,10.931295776367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,2,power_law_1.2,0.07720959782600403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,2,power_law_1.2,0.10080640316009522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,2,power_law_1.2,0.10967040061950684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,2,power_law_1.2,0.11746560335159302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,2,power_law_1.2,0.12297600507736206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,2,power_law_1.2,0.12265599966049194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,2,power_law_1.2,0.13184640407562256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,2,power_law_1.2,0.13868160247802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,2,power_law_1.2,0.14899840354919433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,2,power_law_1.2,0.15075199604034423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,2,power_law_1.2,0.1735103964805603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,2,power_law_1.2,0.19028480052948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,2,power_law_1.2,0.19713280200958253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,balanced,8.684207916259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,2,power_law_1.2,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,2,power_law_1.2,0.2538367986679077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,2,power_law_1.2,0.3102848052978516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,2,power_law_1.2,0.38522241115570066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,2,power_law_1.2,0.5014912128448487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,2,power_law_1.2,0.6410431861877441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,2,power_law_1.2,0.9801152229309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,2,power_law_1.2,1.3400639533996581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,2,power_law_1.2,2.0519487380981447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,2,power_law_1.2,2.4819583892822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,2,power_law_1.2,3.350368118286133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,2,power_law_1.2,4.825049591064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,2,power_law_1.2,10.24062728881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,balanced,0.20306666692097983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,balanced,0.12125333150227864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,balanced,0.19612266620000204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,balanced,0.11678399642308553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,balanced,0.1943626602490743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,balanced,0.12054933110872905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,balanced,0.20384534200032553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,balanced,0.124399999777476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,balanced,0.3469546635945638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,balanced,0.21091733376185098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,balanced,0.6672000090281168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,balanced,0.37396268049875897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,balanced,0.9971253077189127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,balanced,0.5388853152592977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,balanced,0.9357333183288574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,balanced,0.5032800038655599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,balanced,0.5002559820810953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,balanced,0.9955999851226807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,balanced,0.5230933427810669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,balanced,0.9540266990661621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,balanced,0.5361440181732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,balanced,0.9948320388793945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,balanced,0.531930685043335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,balanced,0.5340533256530762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,balanced,0.8906613190968832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,balanced,0.5512959957122803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,balanced,1.0185759862263997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,balanced,0.5034186840057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,balanced,1.0151573022206624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,balanced,0.5310773452123007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,balanced,1.0110560258229573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,balanced,0.5265973409016927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,balanced,0.9837813377380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,balanced,0.9591733614603678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,balanced,0.4829813241958618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,balanced,0.9374826749165853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,balanced,0.5357120037078857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,balanced,0.05753066639105479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,balanced,0.932703971862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,balanced,0.05489600201447805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,balanced,0.5739253362019857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,balanced,0.057775999108950295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.9459327697753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,balanced,0.9626560211181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,balanced,0.568554679552714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,balanced,0.06206933160622915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.920684814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,balanced,0.08004799981911977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,balanced,0.9225760300954183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,balanced,0.10214933753013611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.9503935813903809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,balanced,0.5664586623509725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,balanced,0.1330773333708445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.4017216205596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,balanced,0.8468266328175863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,balanced,0.1337440013885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.606547212600708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,balanced,0.563760002454122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,balanced,0.13410666584968567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.747430419921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,balanced,0.1341386636098226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,balanced,0.8339573542277018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,balanced,0.1361120045185089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.7425792217254639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,balanced,0.138154665629069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,balanced,0.5106666485468546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.832153606414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,balanced,0.13967999815940857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.8568960189819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,balanced,0.6500106652577718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,balanced,0.1397546629110972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.8796863555908203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,balanced,0.14759467045466104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,balanced,0.1481706698735555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.8932095527648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,balanced,1.082271973292033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.8860608100891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,balanced,0.15332266688346863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,balanced,1.625205357869466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.8390080451965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,balanced,0.1641973356405894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.9075584411621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.8372927665710449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.8182784080505371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,balanced,0.9624160130818685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.8041088104248046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,balanced,0.17653866608937582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,balanced,1.227669318517049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.7590335845947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.5439680099487305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.8924799919128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.5436480045318604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.01,1.047379207611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.5299776077270508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.01,1.3045632362365722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.23575680255889891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,balanced,1.5632692972819011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.01,1.5960448265075684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.306604790687561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,balanced,0.1957813302675883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,balanced,2.157562732696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.01,1.939686393737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.4163328170776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,balanced,0.21371734142303467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.41984000205993655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.01,2.334726333618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.47545599937438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.01,2.939993667602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,balanced,0.24854934215545654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.45401601791381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.4659264087677002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.01,4.535635375976563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.4520256042480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.01,5.906092834472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.4826687812805176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.4972032070159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,balanced,2.099130630493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.01,8.003008270263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.4836415767669678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,balanced,3.009200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.5020287990570068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.01,12.281484985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.4598976135253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,balanced,0.28809599081675213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,power_law_1.01,0.1319808006286621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.4812032222747803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,power_law_1.01,0.12768640518188476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.4728064060211182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,power_law_1.01,0.12609280347824098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.01,24.218534851074217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.5469888210296631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,power_law_1.01,0.07904000282287597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,balanced,0.35677866141001385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.5931327819824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,power_law_1.01,0.09804800152778625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.6626239776611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,power_law_1.01,0.10238720178604126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,power_law_1.01,0.11322879791259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.8583999633789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,power_law_1.01,0.12316800355911255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,1.0655551910400392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,balanced,0.4586133162180583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,power_law_1.01,0.12273919582366943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,power_law_1.01,0.11473920345306396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,1.3740927696228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,power_law_1.01,0.1328511953353882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,power_law_1.01,0.1389248013496399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,1.6418048858642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,balanced,3.082789421081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,power_law_1.01,0.14035840034484864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,balanced,4.400368054707845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,2.6018112182617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,power_law_1.01,0.1503999948501587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,power_law_1.01,0.15332479476928712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,balanced,0.6086133321126302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,3.0508800506591798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,power_law_1.01,0.16723840236663817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.969593620300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,power_law_1.01,0.1838528037071228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.5394879817962647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.01,4.216985702514648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.9472512245178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,power_law_1.01,0.20979840755462648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.9475647926330566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.5386816024780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.01,7.163308715820312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.4094719886779785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.4981376171112061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.6486080169677735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.01,0.233459210395813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.28476800918579104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.6170239925384522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.01,14.608198547363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.30938880443572997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.7359424114227295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.3286207914352417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.01,0.26423680782318115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.8166975975036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.3414144039154053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.01,0.29266560077667236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.8449088096618652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.42880001068115237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.01,0.39426560401916505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,balanced,0.8297066688537598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.7265215873718261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.4810175895690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.8174847602844239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.44614400863647463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.45656957626342776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.01,0.4570943832397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.7813504219055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.46316161155700686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.01,0.6531519889831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.8561280250549317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.47292799949645997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.9274496078491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.01,0.860921573638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.46282238960266114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.8955264091491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.01,1.2828160285949708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.4924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.7835072040557861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.4988096237182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.8224255561828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.01,1.7639167785644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.44846720695495607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.9264320373535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,64,power_law_1.2,1.0472576141357421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.499238395690918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,64,power_law_1.2,1.146406364440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.5596672058105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,balanced,1.0261120001475017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,64,power_law_1.2,1.4933695793151855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,power_law_1.01,2.245408058166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.628115177154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.8229311943054199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,64,power_law_1.2,2.1317375183105467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,power_law_1.01,3.2761985778808596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,balanced,7.627648035685222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,1.0459839820861816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,balanced,5.54582405090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,64,power_law_1.2,2.215398406982422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,1.319059181213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,power_law_1.01,6.9439231872558596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,64,power_law_1.2,3.2153343200683593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,1.8
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,64,power_law_1.2,3.949919891357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,2.3862079620361327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,64,power_law_1.2,7.640876770019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,3.4594047546386717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,4.545062255859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,64,power_law_1.2,9.031027221679688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,64,power_law_1.2,6.344211196899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,64,power_law_1.2,10.553043365478516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,64,power_law_1.2,9.504422760009765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,balanced,1.5896107355753581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,64,power_law_1.2,19.644415283203124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,64,power_law_1.2,21.500090026855467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,64,power_law_1.2,41.01347351074219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,balanced,3.1317227681477866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,64,power_law_1.2,0.13052799701690673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,64,power_law_1.2,0.12643840312957763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,64,power_law_1.2,0.12562559843063353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,64,power_law_1.2,0.081740802526474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,64,power_law_1.2,0.08554239869117737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,64,power_law_1.2,0.10981119871139526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,64,power_law_1.2,0.10919040441513062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,64,power_law_1.2,0.12595839500427247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,64,power_law_1.2,0.1322111964225769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,balanced,0.11886399984359741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,64,power_law_1.2,0.12727680206298828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,64,power_law_1.2,0.1285375952720642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,balanced,0.11620266238848369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,64,power_law_1.2,0.13068159818649291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,balanced,0.12249599893887837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,64,power_law_1.2,0.13020800352096557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,balanced,0.20057066281636557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,64,power_law_1.2,0.1430848002433777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,balanced,0.3675040006637573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,64,power_law_1.2,0.16243200302124022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,balanced,0.6834186712900797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,balanced,0.9990932941436768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,64,power_law_1.2,0.17148159742355346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,balanced,0.9802453517913818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,64,power_law_1.2,0.1855039954185486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,balanced,0.9977813561757406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,64,power_law_1.2,0.22648320198059083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,balanced,0.9906346797943115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,balanced,0.9430560270945231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,balanced,0.9529173374176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.2,0.2702080011367798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,balanced,0.9398399988810221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,balanced,0.9342453479766846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.2,0.2618367910385132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,balanced,0.9335467020670573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.2,0.3656831979751587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,balanced,0.9258666833241781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.2,0.50862717628479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,balanced,0.07815999786059062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,balanced,0.9687360127766927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,balanced,0.9876213073730469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,balanced,0.0805866668621699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,balanced,0.07974400122960408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.2,0.561190414428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,balanced,0.9651093482971191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,balanced,0.13371200362841287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.2,0.8998784065246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,balanced,0.22674665848414102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,balanced,0.9221599896748861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.2,1.0463359832763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,balanced,0.3836746613184611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.2,1.6999679565429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,balanced,0.54585067431132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,balanced,0.9432319800059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,balanced,0.5315466721852621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.2,2.339743995666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,balanced,0.5354186693827311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,balanced,0.92413330078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.01,0.7105408191680909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,balanced,0.5351200103759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,balanced,0.5788533290227255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,64,power_law_1.2,2.9226879119873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.01,1.0247424125671387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,balanced,0.5655306577682495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,balanced,0.8577866554260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,64,power_law_1.2,4.314323043823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,balanced,0.5370560089747111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.01,1.026144027709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,balanced,0.5479840040206909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.01,0.3231935977935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,64,power_law_1.2,10.361209869384766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,balanced,0.5196533203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,balanced,0.6992853482564291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,balanced,0.5100533167521158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.01,0.4816256046295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.01,0.39045760631561277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,balanced,0.047210668524106346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,balanced,0.5099039872487386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.01,0.6385536193847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.01,0.5477568149566651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,balanced,0.0476800004641215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,balanced,0.501039981842041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.01,0.6845056056976319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.01,0.5499199867248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,balanced,0.04799466828505198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,balanced,1.677135944366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,balanced,0.604634682337443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,balanced,0.06189866860707601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.01,0.8362431526184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.01,0.18748799562454224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,balanced,0.08027733365694682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,balanced,0.5637653271357218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.01,0.2695807933807373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.01,0.8550271987915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,balanced,0.10458667079607646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.01,0.3349695920944214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,balanced,0.13335466384887695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.01,0.7879487991333007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,balanced,0.581717332204183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,balanced,0.1357439955075582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.01,0.3324608087539673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.01,0.8291520118713379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,balanced,0.13609066605567932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.01,0.40274558067321775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.01,0.8621055603027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,balanced,0.1359946628411611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,balanced,1.3357547124226887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,balanced,0.6182986497879028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.01,0.4261760234832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,balanced,0.1381600002447764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.01,0.8220735549926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.01,0.4389503955841064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,balanced,0.1399679978688558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.01,0.8694975852966309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.01,0.4808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,balanced,0.5818826754887899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,balanced,0.14134400089581808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.01,0.4266687870025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,power_law_1.01,0.11411839723587036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.01,0.888038444519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,balanced,0.14266666769981384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.01,0.45469441413879397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,power_law_1.01,0.13224320411682128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.01,0.887116813659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.01,0.44776320457458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,balanced,0.1502240002155304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.01,0.7926527976989746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,balanced,0.5532533327738444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.01,0.4784063816070557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,power_law_1.01,0.12794239521026612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,balanced,0.1514400045077006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.01,0.4877312183380127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,balanced,2.2932106653849282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,balanced,0.15772266189257303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.01,0.8957183837890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.01,0.4761536121368408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,power_law_1.01,0.07493759989738465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,balanced,0.1695680022239685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.01,0.8973183631896973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.01,0.49409918785095214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.01,0.5284480094909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,power_law_1.01,0.08023679852485657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.01,1.117420768737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,balanced,1.1084213256835938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.01,0.5432831764221191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.01,1.178816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.01,0.6384895801544189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,power_law_1.01,0.09290239810943604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.01,1.376147174835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.01,0.8157695770263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,balanced,0.18406933546066284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,power_law_1.01,0.10059520006179809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.01,1.6525184631347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.01,0.9163135528564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.01,2.2500415802001954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.01,1.2577664375305175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,power_law_1.01,0.11701120138168335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,balanced,3.198063850402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,balanced,1.0380853017171223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.01,2.7369663238525392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.01,1.486969566345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,power_law_1.01,0.12060799598693847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.01,2.1997312545776366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,power_law_1.01,0.12506879568099977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.01,3.7417343139648436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,power_law_1.01,0.12640000581741334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.01,2.8486656188964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,32,power_law_1.2,0.6916096210479736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,power_law_1.01,0.13267199993133544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,balanced,0.204367995262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.01,5.009132766723633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.01,3.2970367431640626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,32,power_law_1.2,0.985478401184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,power_law_1.01,0.13502720594406128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,balanced,0.22585066159566244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.01,5.637772750854492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,32,power_law_1.2,0.9346943855285644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,power_law_1.01,0.13458559513092042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.01,5.598438262939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,32,power_law_1.2,0.31549439430236814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,power_law_1.01,0.15047039985656738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,balanced,1.6407999992370605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,balanced,0.26637866099675495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.01,9.474342346191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,32,power_law_1.2,0.39486079216003417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,power_law_1.01,0.16227840185165404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.01,11.063744354248048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,power_law_1.01,0.18409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,32,power_law_1.2,0.562336015701294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,power_law_1.01,0.20173439979553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,32,power_law_1.2,0.5751488208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.01,17.634994506835938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,32,power_law_1.2,0.7420671939849853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,32,power_law_1.2,0.8004608154296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,balanced,4.6747894287109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,power_law_1.01,0.2270143985748291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,32,power_law_1.2,0.7920576095581054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,32,power_law_1.2,0.7395199775695801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,balanced,0.31518399715423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,power_law_1.01,0.23678081035614013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,balanced,2.213146686553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,32,power_law_1.2,0.8678272247314454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,power_law_1.01,0.2915263891220093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,32,power_law_1.2,0.7401343822479248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,power_law_1.01,0.3987519979476929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,balanced,0.3994773228963216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,32,power_law_1.2,0.8272576332092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,32,power_law_1.2,0.7781439781188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,32,power_law_1.2,0.8282431602478028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,power_law_1.01,0.49660158157348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,32,power_law_1.2,0.8433216094970704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,power_law_1.01,0.66494722366333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,32,power_law_1.2,0.9353919982910156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,32,power_law_1.2,0.9644031524658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,balanced,0.5332266489664713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,power_law_1.01,0.8765312194824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,32,power_law_1.2,1.166368007659912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,power_law_1.01,1.1867072105407714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,32,power_law_1.2,1.3068544387817382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,32,power_law_1.2,1.6285568237304688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,balanced,3.2999305725097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,32,power_law_1.2,2.0613311767578124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,32,power_law_1.2,2.399942398071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,power_law_1.01,1.6776384353637694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,balanced,0.7131573359171549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,32,power_law_1.2,3.031295967102051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,power_law_1.01,2.065113639831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,32,power_law_1.2,4.734854507446289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,power_law_1.01,2.8056896209716795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,32,power_law_1.2,6.522502136230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,32,power_law_1.2,7.5921791076660154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,power_law_1.01,6.008172988891602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,balanced,8.012309392293295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,32,power_law_1.2,13.454931640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,balanced,0.9636693000793457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,32,power_law_1.2,24.852230834960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,balanced,1.1841386953989665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,32,power_law_1.2,0.38840320110321047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,32,power_law_1.2,0.5467904090881348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,32,power_law_1.2,0.5196159839630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,32,power_law_1.2,0.1937343955039978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,32,power_law_1.2,0.31363840103149415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,balanced,5.870992024739583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,32,power_law_1.2,0.29410560131073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,32,power_law_1.2,0.34872961044311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,32,power_law_1.2,0.3961087942123413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,32,power_law_1.2,0.37907838821411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,32,power_law_1.2,0.43415040969848634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,balanced,1.8404693603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,32,power_law_1.2,0.4061439990997314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,32,power_law_1.2,0.454911994934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,32,power_law_1.2,0.4650047779083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,32,power_law_1.2,0.450380802154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,32,power_law_1.2,0.48439679145812986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,32,power_law_1.2,0.4526336193084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,32,power_law_1.2,0.48192639350891114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,32,power_law_1.2,0.5099904060363769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,32,power_law_1.2,0.5446335792541503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,32,power_law_1.2,0.6427711963653564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,32,power_law_1.2,0.7557824134826661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,32,power_law_1.2,0.960211181640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,32,power_law_1.2,1.1049280166625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,32,power_law_1.2,1.5442943572998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,32,power_law_1.2,1.9407360076904296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,32,power_law_1.2,2.8991935729980467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,32,power_law_1.2,3.6595073699951173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,balanced,0.06006933252016703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,32,power_law_1.2,4.4446464538574215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,balanced,0.05834133426348368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,balanced,0.06287999947865804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,balanced,3.6293280919392905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,32,power_law_1.2,7.970611572265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,balanced,0.07631466786066692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,balanced,0.10514133175214131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,32,power_law_1.2,0.10496640205383301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,balanced,0.1614720026652018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,balanced,0.21851734320322672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,32,power_law_1.2,0.13333120346069335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,32,power_law_1.2,15.154042053222657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,balanced,0.22069867451985678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,32,power_law_1.2,0.12353279590606689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,balanced,0.2200053334236145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,balanced,0.22121065855026245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,32,power_law_1.2,0.06718720197677612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,balanced,0.2226240038871765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,32,power_law_1.2,0.08073599934577942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,balanced,0.22002132733662924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,32,power_law_1.2,0.08657280206680298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,balanced,0.22593067089716592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,balanced,0.228602667649587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,32,power_law_1.2,0.09553279876708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,balanced,0.23247466484705606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,32,power_law_1.2,0.11432960033416747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,balanced,0.23906666040420532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,32,power_law_1.2,0.11500799655914307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,balanced,0.23841599623362222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,32,power_law_1.2,0.11835520267486573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,balanced,0.24759467442830405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,32,power_law_1.2,0.1229375958442688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,balanced,0.2658453385035197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,32,power_law_1.2,0.1314303994178772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,balanced,0.28773866097132367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,32,power_law_1.2,0.14071040153503417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,32,power_law_1.2,0.13883520364761354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,balanced,0.30959999561309814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,32,power_law_1.2,0.14985599517822265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,32,power_law_1.2,0.165721595287323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,balanced,0.34669331709543866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,32,power_law_1.2,0.1737920045852661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,32,power_law_1.2,0.22585599422454833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,balanced,0.3983786503473918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,32,power_law_1.2,0.24803199768066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,balanced,0.47814400990804035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,balanced,0.04906666775544485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,32,power_law_1.2,0.26793599128723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,32,power_law_1.2,0.36627840995788574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.01,0.11234560012817382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,balanced,0.04958933095137278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,balanced,0.5756853421529134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,32,power_law_1.2,0.461740779876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,balanced,0.05638933181762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.01,0.15523200035095214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,balanced,0.060032000144322716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.01,0.21093759536743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,balanced,0.07879999776681264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,32,power_law_1.2,0.5914432048797608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.01,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,balanced,0.10659199953079224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,32,power_law_1.2,0.798201608657837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,balanced,0.13796266913414001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.01,0.10822399854660034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,balanced,0.0484799991051356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,balanced,0.13943466544151306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,balanced,0.7305866877237955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,32,power_law_1.2,1.032089614868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,balanced,0.049098665515581764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.01,0.14434560537338256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,balanced,0.14032533764839172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,balanced,0.1414346694946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,balanced,0.05117866893609365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,32,power_law_1.2,1.65283203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.01,0.14321919679641723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,balanced,0.06062933305899302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,balanced,0.14317333698272705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.01,0.1738368034362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,32,power_law_1.2,2.093894386291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,balanced,0.07778133451938629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,balanced,0.1452959974606832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.01,0.17786879539489747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.01,0.07663999795913697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,balanced,0.10564800103505452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,balanced,0.1479520003000895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,32,power_law_1.2,2.490963172912598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,balanced,0.13820800185203552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.01,0.17861759662628174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,balanced,0.149807999531428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.01,0.10191999673843384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,32,power_law_1.2,4.235903930664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,balanced,0.13922133048375449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,balanced,0.9328266779581705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,balanced,0.15760533014933267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.01,0.17805440425872804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.01,0.13067519664764404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,balanced,0.13990400234858194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,balanced,0.15918933351834616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.01,0.18271360397338868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,32,power_law_1.2,10.686476898193359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.01,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,balanced,0.1399999956289927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,balanced,0.16613866885503134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.01,0.19244799613952637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,balanced,0.14249599973360697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.01,0.08041599988937378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,balanced,0.18134933710098267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,balanced,0.14506133397420248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.01,0.1901311993598938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.01,0.10255359411239624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,balanced,0.14696000019709268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,balanced,0.19490132729212442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.01,0.20743680000305176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.01,0.10398080348968505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,balanced,0.1492906709512075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.01,0.12039680480957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.01,0.21434240341186522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,balanced,0.2226453423500061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,balanced,0.15761066476504007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.01,0.11345920562744141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.01,0.22525439262390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,balanced,0.2548373341560364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,balanced,1.114367961883545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,balanced,0.15965867042541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.01,0.12033280134201049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.01,0.24528639316558837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,balanced,0.16636266311009726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.01,0.27368960380554197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.01,0.12284159660339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,balanced,0.30744000275929767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,balanced,0.18120533227920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.01,0.3309119939804077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.01,0.12967679500579835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.01,0.13416320085525513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.01,0.3631040096282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,balanced,0.3587840000788371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.01,0.13523199558258056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.01,0.4599743843078613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,balanced,0.20140800873438516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.01,0.14287999868392945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.01,0.4916863918304443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,balanced,0.4606613318125407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.01,0.14718079566955566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.01,0.5897856235504151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.01,0.16503679752349854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.01,0.18455040454864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.01,0.7755839824676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.01,0.19833600521087646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.01,1.0089216232299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,balanced,0.5840266545613607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.01,0.239084792137146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,balanced,0.22923733790715536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.01,1.2156031608581543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,balanced,1.6809333165486653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.01,0.2716991901397705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,balanced,0.25819732745488483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.01,0.3475136041641235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.01,1.506713581085205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.01,0.4221759796142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,balanced,0.3158559997876485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.01,2.508755111694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.01,0.5329919815063476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,balanced,0.7991360028584799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.01,0.7001855850219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.01,4.743110275268554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.01,0.9662655830383301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.01,1.2331839561462403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,power_law_1.01,0.0837440013885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.01,1.5813887596130372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,power_law_1.01,0.10828160047531128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,balanced,0.39636798699696857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.01,2.4107839584350588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,power_law_1.01,0.13738240003585817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,balanced,1.0265440146128337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,power_law_1.01,0.06707199811935424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.01,4.618297576904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,balanced,0.5152000188827515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,power_law_1.01,0.08454399704933166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,power_law_1.01,0.08751360177993775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,power_law_1.01,0.09966719746589661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,balanced,0.6832106908162435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,power_law_1.01,0.11827839612960815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,power_law_1.01,0.12540160417556762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,power_law_1.01,0.1263360023498535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,balanced,1.2434133688608806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,16,power_law_1.2,0.11313920021057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,power_law_1.01,0.12722560167312622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,16,power_law_1.2,0.15716480016708373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,power_law_1.01,0.13386240005493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,balanced,0.9229280153910319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,16,power_law_1.2,0.13800959587097167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,power_law_1.01,0.13207039833068848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,power_law_1.01,0.14613759517669678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,16,power_law_1.2,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,balanced,3.1542879740397134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,power_law_1.01,0.1478656053543091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,16,power_law_1.2,0.10229760408401489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,power_law_1.01,0.16013439893722534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,16,power_law_1.2,0.12572799921035765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,power_law_1.01,0.175654399394989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,16,power_law_1.2,0.13924479484558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,power_law_1.01,0.20765440464019774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,16,power_law_1.2,0.16876800060272218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,16,power_law_1.2,0.17249280214309692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,power_law_1.01,0.22485120296478273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,16,power_law_1.2,0.16841599941253663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,balanced,1.2536906401316326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,balanced,1.9242933591206868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,16,power_law_1.2,0.1696768045425415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,16,power_law_1.2,0.17935359477996826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,power_law_1.01,0.25515520572662354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,16,power_law_1.2,0.19338879585266114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,power_law_1.01,0.3328448057174683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,16,power_law_1.2,0.2000511884689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,power_law_1.01,0.4109951972961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,16,power_law_1.2,0.2200256109237671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,16,power_law_1.2,0.23230719566345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,power_law_1.01,0.5505472183227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,16,power_law_1.2,0.2320768117904663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,balanced,1.5377813975016277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,power_law_1.01,0.7246528148651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,16,power_law_1.2,0.25673599243164064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,power_law_1.01,0.9373503684997558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,16,power_law_1.2,0.2922111988067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,16,power_law_1.2,0.3467008113861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,power_law_1.01,1.4463232040405274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,16,power_law_1.2,0.41045122146606444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,16,power_law_1.2,0.5242815971374511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,power_law_1.01,1.9004352569580079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,16,power_law_1.2,0.507257604598999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,power_law_1.01,2.149510383605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,16,power_law_1.2,0.6666240215301513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,power_law_1.01,3.795328140258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,16,power_law_1.2,0.8193280220031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,16,power_law_1.2,1.1466496467590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,power_law_1.01,6.894521331787109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,16,power_law_1.2,1.4895551681518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,balanced,2.407599925994873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,16,power_law_1.2,1.9433855056762694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,16,power_law_1.2,0.07574399709701538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,16,power_law_1.2,2.663667106628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,16,power_law_1.2,0.10550400018692016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,16,power_law_1.2,0.09120000004768372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,16,power_law_1.2,5.584716796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,balanced,3.722618738810221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,16,power_law_1.2,0.06500480175018311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,16,power_law_1.2,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,16,power_law_1.2,0.09055359959602356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,16,power_law_1.2,0.09112319946289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,16,power_law_1.2,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,16,power_law_1.2,0.11012480258941651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,16,power_law_1.2,0.11448960304260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,16,power_law_1.2,0.12758400440216064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,16,power_law_1.2,0.12945280075073243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,16,power_law_1.2,0.12855679988861085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,16,power_law_1.2,0.13318400382995604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,16,power_law_1.2,0.14387840032577515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,16,power_law_1.2,0.15665919780731202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,16,power_law_1.2,0.16635520458221437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,16,power_law_1.2,0.20100479125976561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,16,power_law_1.2,0.2169408082962036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,16,power_law_1.2,0.25861120223999023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,16,power_law_1.2,0.29539198875427247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,16,power_law_1.2,0.373036789894104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,16,power_law_1.2,0.4331071853637695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,16,power_law_1.2,0.6164991855621338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,16,power_law_1.2,0.7417407989501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,16,power_law_1.2,1.0981311798095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,balanced,4.7328745524088545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,16,power_law_1.2,1.3849216461181642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,16,power_law_1.2,1.7375360488891602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,16,power_law_1.2,2.809651184082031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,16,power_law_1.2,0.07934079766273498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,16,power_law_1.2,5.906393432617188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,16,power_law_1.2,0.1080896019935608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,balanced,0.056890666484832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,16,power_law_1.2,0.09797760248184204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,balanced,0.055861334005991616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,balanced,0.06241600215435028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,16,power_law_1.2,0.06673280000686646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,balanced,0.07645866771539052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,16,power_law_1.2,0.07277439832687378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,balanced,0.10785067081451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,balanced,0.16527466972668967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,16,power_law_1.2,0.09602559804916382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,balanced,0.2249600092569987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,16,power_law_1.2,0.09265919923782348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,balanced,0.22522666056950888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,16,power_law_1.2,0.11951359510421752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,balanced,0.22619734207789102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,16,power_law_1.2,0.11353600025177002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,balanced,0.22588266928990683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,balanced,0.22642666101455688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,16,power_law_1.2,0.11320960521697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,balanced,0.23067200183868408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,16,power_law_1.2,0.1258239984512329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,balanced,0.224506676197052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,balanced,0.23414399226506552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,16,power_law_1.2,0.1324288010597229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,balanced,0.23577600717544556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,16,power_law_1.2,0.1343808054924011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,balanced,0.24754132827123007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,balanced,0.25170665979385376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,balanced,0.04884799818197886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,16,power_law_1.2,0.14253439903259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,balanced,0.269381324450175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,balanced,0.04939733445644379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,16,power_law_1.2,0.15399680137634278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,balanced,0.2783199946085612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,16,power_law_1.2,0.16042239665985109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,balanced,0.06200533111890157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,balanced,0.30560533205668133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,16,power_law_1.2,0.18322559595108032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,balanced,0.07957866787910461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,balanced,0.11312533418337505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,balanced,0.34307201703389484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,16,power_law_1.2,0.214630389213562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,balanced,0.1448853313922882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,balanced,0.1453546682993571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,balanced,0.4028693437576294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,balanced,0.14519466956456503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,16,power_law_1.2,0.2532927989959717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,balanced,0.1480959951877594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,balanced,0.44669334093729657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,balanced,0.1490720013777415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,balanced,0.1506186624368032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,16,power_law_1.2,0.27781119346618655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,balanced,0.15458133816719055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,balanced,0.5644960006078085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,16,power_law_1.2,0.3526079893112183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,balanced,0.15779200196266174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,16,power_law_1.2,0.4666304111480713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,balanced,0.16671999295552573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,16,power_law_1.2,0.6158527851104736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,balanced,0.1695093313852946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,balanced,0.6892746289571127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,16,power_law_1.2,0.833619213104248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,balanced,0.17803732554117838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,16,power_law_1.2,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,balanced,0.19594667355219522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,16,power_law_1.2,1.682156753540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,balanced,0.21356266736984253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,balanced,0.9173973401387533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,balanced,0.2490239938100179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,16,power_law_1.2,2.2117759704589846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,16,power_law_1.2,2.5663808822631835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,balanced,0.2834346691767375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,16,power_law_1.2,5.237900924682617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,balanced,0.34335466225941974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,balanced,0.05237866441408793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,16,power_law_1.2,9.118029022216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,balanced,0.41359468301137287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,balanced,0.05550933380921682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,balanced,1.2014666398366292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,balanced,0.058746665716171265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.01,0.07819520235061646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,balanced,0.07134933272997539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,balanced,0.08941333492596944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.01,0.10836479663848878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,balanced,0.5470399856567383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,balanced,0.11619200309117635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.01,0.1534335970878601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,balanced,0.15034133195877075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,balanced,0.15169599652290344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.01,0.07651200294494628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,balanced,0.15397333105405173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.01,0.09886720180511474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,balanced,0.15333867073059082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,balanced,0.6914400259653727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.01,0.12276480197906495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,balanced,0.15585066874821982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,balanced,1.5290346145629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.01,0.06053119897842407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,balanced,0.15875200430552164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.01,0.1424512028694153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,balanced,0.16237333416938782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.01,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.01,0.15738879442214965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,balanced,0.1669493317604065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.01,0.1026304006576538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.01,0.15815039873123168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,balanced,0.1767786741256714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,balanced,0.9747573534647623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.01,0.06216959953308106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,balanced,0.17803732554117838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.01,0.1719231963157654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.01,0.0780672013759613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,balanced,0.1922559936841329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.01,0.18135039806365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.01,0.08982399702072144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,balanced,0.21200533707936606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.01,0.17734400033950806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.01,0.09887359738349914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.01,0.1944383978843689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.01,0.1122048020362854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.01,0.20097920894622803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.01,0.11672320365905761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.01,0.2210304021835327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.01,0.121452796459198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,balanced,0.23732266823450723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,balanced,1.2469120025634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.01,0.13035520315170288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.01,0.23042559623718262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,balanced,2.1166346867879233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.01,0.12798080444335938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.01,0.23045759201049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.01,0.13664000034332274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.01,0.2632895946502686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,power_law_1.01,0.07308800220489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.01,0.29051520824432375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.01,0.1451647996902466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,balanced,0.3015039960543315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.01,0.33394560813903806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.01,0.15700479745864868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,power_law_1.01,0.08631680011749268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.01,0.16430720090866088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,power_law_1.01,0.12021119594573974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,balanced,0.3577760060628255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.01,0.36193280220031737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.01,0.18187520503997803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,power_law_1.01,0.07153279781341552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,8,power_law_1.2,0.07831040024757385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,balanced,1.5563626289367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.01,0.45137920379638674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.01,0.20762240886688232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,power_law_1.01,0.0840448021888733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,8,power_law_1.2,0.10461440086364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,balanced,0.43886931737263996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.01,0.5197440147399902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,8,power_law_1.2,0.09662719964981079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.01,0.22111361026763915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,power_law_1.01,0.0972544014453888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.01,0.7427519798278809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,8,power_law_1.2,0.07534080147743225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.01,0.26338560581207277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,power_law_1.01,0.10945919752120972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,8,power_law_1.2,0.09763200283050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.01,0.9072896003723144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.01,0.2949887990951538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,power_law_1.01,0.12536319494247436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,8,power_law_1.2,0.11354880332946778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,8,power_law_1.2,0.1355520009994507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.01,0.37091200351715087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,power_law_1.01,0.12922879457473754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.01,1.2066368103027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,balanced,0.5611573457717896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,8,power_law_1.2,0.1504639983177185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,power_law_1.01,0.13174400329589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.01,0.4667520046234131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.01,1.4941760063171388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,8,power_law_1.2,0.16320639848709106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,power_law_1.01,0.14165120124816893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.01,0.61976318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,8,power_law_1.2,0.15763839483261108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.01,1.8394880294799805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,8,power_law_1.2,0.17486079931259155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,power_law_1.01,0.14433280229568482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.01,0.8113151550292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,balanced,0.7358880043029785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,8,power_law_1.2,0.17760640382766724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.01,2.5705535888671873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,power_law_1.01,0.1518720030784607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.01,1.1243840217590333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,8,power_law_1.2,0.18451199531555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,power_law_1.01,0.15975040197372437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,8,power_law_1.2,0.19534720182418824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.01,1.5060992240905762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.01,5.353350448608398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,8,power_law_1.2,0.2150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,power_law_1.01,0.17238399982452393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,balanced,2.345658620198568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.01,1.8050880432128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,8,power_law_1.2,0.23089280128479003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,balanced,1.0094986756642659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,power_law_1.01,0.18201600313186644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,8,power_law_1.2,0.2435391902923584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,power_law_1.01,0.200927996635437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,8,power_law_1.2,0.29845759868621824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.01,2.8251583099365236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,8,power_law_1.2,0.29701120853424073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,power_law_1.01,0.24433279037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,8,power_law_1.2,0.35086081027984617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.01,5.808012771606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,8,power_law_1.2,0.3817408084869385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,balanced,4.106874783833821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,8,power_law_1.2,0.5054143905639649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,power_law_1.01,0.27742719650268555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,balanced,1.3797760009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,8,power_law_1.2,0.6065792083740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,8,power_law_1.2,0.8346688270568847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,power_law_1.01,0.3395136117935181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,8,power_law_1.2,0.9798015594482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,power_law_1.01,0.413804817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,8,power_law_1.2,1.425011157989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,power_law_1.01,0.548095989227295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,8,power_law_1.2,1.6844160079956054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,balanced,1.8392267227172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,8,power_law_1.2,2.130739212036133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,power_law_1.01,0.6933119773864747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,power_law_1.01,0.9475263595581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,8,power_law_1.2,3.3196033477783202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,power_law_1.01,1.2785792350769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,power_law_1.01,1.8557695388793944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,8,power_law_1.2,5.514905548095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,power_law_1.01,2.29935359954834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,power_law_1.01,2.7944063186645507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,power_law_1.01,4.7157440185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,balanced,2.277989387512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,power_law_1.01,9.686278533935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,balanced,4.573871930440267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,8,power_law_1.2,0.06095359921455383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,8,power_law_1.2,0.0728767991065979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,8,power_law_1.2,0.07351679801940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,8,power_law_1.2,0.06282879710197449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,balanced,3.557685216267904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,8,power_law_1.2,0.07283200025558471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,8,power_law_1.2,0.08577280044555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,8,power_law_1.2,0.09353600144386291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,8,power_law_1.2,0.11548800468444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,8,power_law_1.2,0.11415040493011475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,8,power_law_1.2,0.1215999960899353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,8,power_law_1.2,0.12494080066680908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,8,power_law_1.2,0.13122559785842897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,8,power_law_1.2,0.13678719997406005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,8,power_law_1.2,0.14446719884872436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,8,power_law_1.2,0.15602560043334962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,8,power_law_1.2,0.16060800552368165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,8,power_law_1.2,0.18213119506835937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,8,power_law_1.2,0.2138751983642578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,8,power_law_1.2,0.2172800064086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,8,power_law_1.2,0.2791167974472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,8,power_law_1.2,0.3162496089935303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,8,power_law_1.2,0.39582080841064454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,8,power_law_1.2,0.4984000205993652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,8,power_law_1.2,0.6662464141845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,8,power_law_1.2,0.8810303688049317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,balanced,6.955519994099935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,8,power_law_1.2,1.2477631568908691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,8,power_law_1.2,1.611840057373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,8,power_law_1.2,2.1107967376708983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,8,power_law_1.2,3.1421056747436524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,8,power_law_1.2,6.423353576660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,8,power_law_1.2,0.07056000232696533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,8,power_law_1.2,0.08636159896850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,8,power_law_1.2,0.07783039808273315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,8,power_law_1.2,0.07138559818267823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,balanced,0.056421334544817604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,8,power_law_1.2,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,balanced,0.05699199934800466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,balanced,0.06273066500822704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,balanced,0.049584001302719116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,8,power_law_1.2,0.09091200232505799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,balanced,0.07957866787910461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,balanced,0.051455999414126076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,balanced,0.11187199751536052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,8,power_law_1.2,0.10117759704589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,balanced,0.05459199845790863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,balanced,0.17339734236399332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,balanced,0.06545599798361461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,8,power_law_1.2,0.12142080068588257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,balanced,0.2360853354136149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,balanced,0.08919466535250346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,balanced,0.23333867390950522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,balanced,0.12828800082206726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,8,power_law_1.2,0.12563199996948243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,balanced,0.22923199335734049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,balanced,0.16780267159144083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,balanced,0.24089600642522177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,8,power_law_1.2,0.13044480085372925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,balanced,0.1681119998296102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,balanced,0.23956799507141113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,8,power_law_1.2,0.13462400436401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,balanced,0.2463573416074117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,balanced,0.16907199223836264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,balanced,0.253493328889211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,balanced,0.16988799969355264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,8,power_law_1.2,0.14501760005950928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,balanced,0.25990933179855347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,balanced,0.17314666509628296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,8,power_law_1.2,0.14467840194702147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,balanced,0.26867733399073285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,balanced,0.17819199959437051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,8,power_law_1.2,0.1566975951194763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,balanced,0.27406932910283405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,balanced,0.1813653310139974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,8,power_law_1.2,0.1715008020401001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,balanced,0.2590240041414897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,balanced,0.18300267060597739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,8,power_law_1.2,0.1889024019241333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,balanced,0.27949867645899457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,balanced,0.1937333345413208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,balanced,0.06762666503588359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.01,0.06349440217018128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,8,power_law_1.2,0.21298561096191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,balanced,0.19908267259597778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,balanced,0.3004213372866313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,balanced,0.07121066749095917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.01,0.08136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,8,power_law_1.2,0.25155200958251955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,balanced,0.07551466425259908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,balanced,0.20981866121292114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,balanced,0.3397279977798462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,balanced,0.08769067128499348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.01,0.10302079916000366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,balanced,0.2312320073445638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,balanced,0.10984533031781514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,balanced,0.39844799041748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.01,0.07682560086250305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,8,power_law_1.2,0.2846400022506714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,balanced,0.25525333484013873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,balanced,0.14475199580192566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.01,0.09437440037727356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,balanced,0.18478399515151978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,balanced,0.4814026753107707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,balanced,0.3018453319867452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,balanced,0.1877653400103251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.01,0.12448639869689941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,8,power_law_1.2,0.3615744113922119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,balanced,0.1901973287264506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,balanced,0.34718934694925946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.01,0.13492480516433716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,balanced,0.5790239969889323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.01,0.05226879715919495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,8,power_law_1.2,0.4479360103607178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,balanced,0.19292799631754556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.01,0.16142079830169678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,8,power_law_1.2,0.6095359802246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.01,0.0644864022731781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,balanced,0.19710399707158408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,balanced,0.4280159870783488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.01,0.17393280267715455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,balanced,0.19989866018295288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.01,0.08167679905891419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,8,power_law_1.2,0.8229375839233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,balanced,0.7827626864115397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.01,0.17634559869766236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,balanced,0.2062879999478658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,8,power_law_1.2,1.1789119720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.01,0.0624064028263092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,balanced,0.5322719812393188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.01,0.18596479892730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,balanced,0.2144320011138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,8,power_law_1.2,1.2888447761535644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.01,0.07900800108909607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,balanced,0.2273599902788798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.01,0.1974400043487549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,8,power_law_1.2,2.2625215530395506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,balanced,0.23389865954717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.01,0.1034432053565979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.01,0.2034303903579712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,balanced,0.985157330830892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,8,power_law_1.2,2.6475008010864256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,balanced,0.7289493083953857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.01,0.10711040496826171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,balanced,0.25197867552439374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.01,0.21337599754333497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,8,power_law_1.2,3.7469951629638674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.01,0.2432960033416748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.01,0.12590080499649048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,balanced,0.28406399488449097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.01,0.2526655912399292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.01,0.1312384009361267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,8,power_law_1.2,5.906201553344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.01,0.25096960067749025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.01,0.1323904037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,balanced,0.9329813321431478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.01,0.28117759227752687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.01,0.14421759843826293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,8,power_law_1.2,12.214412689208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,balanced,1.3636746406555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.01,0.3200767993927002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.01,0.14621440172195435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,balanced,0.3448479970296224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.01,0.15819519758224487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.01,0.39799039363861083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.01,0.16402560472488403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.01,0.43755521774291994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.01,0.17902079820632935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,balanced,1.347317377726237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.01,0.5324863910675048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.01,0.1874624013900757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.01,0.6409535884857178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.01,0.1982143998146057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.01,0.8337471961975098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,balanced,0.45446399847666424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,balanced,1.6896106402079265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.01,0.2297600030899048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.01,1.0065343856811524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,balanced,0.5393919944763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.01,0.259935998916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.01,1.4393792152404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.01,0.3190975904464722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.01,1.8008384704589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,balanced,0.6695840358734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,balanced,1.6839466094970703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.01,0.35075840950012205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.01,2.2313983917236326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.01,0.454150390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.01,3.616454315185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,balanced,0.8812959988911947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.01,0.5824831962585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.01,0.7801663875579834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.01,6.8040000915527346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,balanced,2.05513604482015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.01,0.9626048088073731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,balanced,1.163413365681966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.01,1.36244478225708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,power_law_1.01,0.0746944010257721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.01,1.8344512939453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,balanced,2.0637332598368325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,power_law_1.01,0.08549759984016418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.01,2.324787139892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,balanced,1.6225919723510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,power_law_1.01,0.10515199899673462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.01,3.6477760314941405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,power_law_1.01,0.09096959829330445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,power_law_1.01,0.09956480264663696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.01,7.57325439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,power_law_1.01,0.11920000314712524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,power_law_1.01,0.12721279859542847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,power_law_1.01,0.14610559940338136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,balanced,2.2166453997294107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,power_law_1.01,0.15841280221939086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,power_law_1.01,0.15918079614639283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,balanced,3.110917409261068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,power_law_1.01,0.17354240417480468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,4,power_law_1.2,0.06347519755363465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,power_law_1.01,0.18159359693527222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,4,power_law_1.2,0.08094080090522766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,power_law_1.01,0.18974080085754394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,balanced,3.2095521291097007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,power_law_1.01,0.2043071985244751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,4,power_law_1.2,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,power_law_1.01,0.2269887924194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,4,power_law_1.2,0.07382400035858154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,power_law_1.01,0.23679358959198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,balanced,3.000149408976237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,4,power_law_1.2,0.08737279772758484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,power_law_1.01,0.2675584077835083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,4,power_law_1.2,0.11064319610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,power_law_1.01,0.32718720436096194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,4,power_law_1.2,0.12914559841156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,4,power_law_1.2,0.16344959735870362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,power_law_1.01,0.4116096019744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,4,power_law_1.2,0.1654080033302307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,4,power_law_1.2,0.1712000012397766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,4,power_law_1.2,0.18755840063095092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,power_law_1.01,0.4726208209991455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,4,power_law_1.2,0.19471999406814575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,power_law_1.01,0.5924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,4,power_law_1.2,0.20435841083526612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,balanced,3.7226826349894204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,4,power_law_1.2,0.2202239990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,power_law_1.01,0.789305591583252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,4,power_law_1.2,0.23792641162872313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,power_law_1.01,1.0089983940124512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,4,power_law_1.2,0.26238079071044923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,power_law_1.01,1.399500846862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,4,power_law_1.2,0.2564287900924683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,power_law_1.01,1.8725248336791993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,4,power_law_1.2,0.2866624116897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,power_law_1.01,2.6091264724731444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,4,power_law_1.2,0.34051198959350587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,power_law_1.01,3.6700160980224608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,4,power_law_1.2,0.4062464237213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,power_law_1.01,4.3665214538574215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,4,power_law_1.2,0.4475584030151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,4,power_law_1.2,0.6004799842834473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,power_law_1.01,6.783487701416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,4,power_law_1.2,0.7022528171539306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,balanced,6.054629643758138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,4,power_law_1.2,0.899289608001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,power_law_1.01,12.73070068359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,4,power_law_1.2,1.0569279670715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,balanced,6.34114138285319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,balanced,5.831104278564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,4,power_law_1.2,1.5253952026367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,4,power_law_1.2,1.9266624450683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,4,power_law_1.2,2.4692352294921873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,4,power_law_1.2,4.046303939819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,4,power_law_1.2,8.071469116210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,4,power_law_1.2,0.05235199928283692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,4,power_law_1.2,0.0646399974822998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,4,power_law_1.2,0.06238719820976257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,4,power_law_1.2,0.06421759724617004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,4,power_law_1.2,0.07580800056457519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,4,power_law_1.2,0.09151999950408936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,4,power_law_1.2,0.09898880124092102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,4,power_law_1.2,0.12092159986495972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,4,power_law_1.2,0.12628480195999145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,balanced,11.426923116048178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,4,power_law_1.2,0.13171199560165406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,4,power_law_1.2,0.1409600019454956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,4,power_law_1.2,0.14894720315933227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,4,power_law_1.2,0.15486719608306884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,4,power_law_1.2,0.16682239770889282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,4,power_law_1.2,0.17781120538711548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,4,power_law_1.2,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,4,power_law_1.2,0.07507200241088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,4,power_law_1.2,0.19829119443893434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,4,power_law_1.2,0.08570240139961242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,4,power_law_1.2,0.236409592628479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,balanced,0.0594400018453598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,4,power_law_1.2,0.08451840281486511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,4,power_law_1.2,0.2714816093444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,4,power_law_1.2,0.0870464026927948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,balanced,0.08191999793052673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,4,power_law_1.2,0.32865281105041505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,balanced,0.09659733374913533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,4,power_law_1.2,0.09786880016326904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,balanced,0.13101333379745483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,4,power_law_1.2,0.36954240798950194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,4,power_law_1.2,0.11126400232315063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,balanced,0.19963733355204263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,4,power_law_1.2,0.12679680585861205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,4,power_law_1.2,0.4751232147216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,balanced,0.278437336285909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,balanced,0.2582346598307292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,4,power_law_1.2,0.14715520143508912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,4,power_law_1.2,0.6131455898284912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,balanced,0.26979732513427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,4,power_law_1.2,0.15237760543823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,4,power_law_1.2,0.8637311935424805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,balanced,0.26212799549102783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,4,power_law_1.2,0.15645439624786378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,balanced,0.2710240085919698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,4,power_law_1.2,1.0050111770629884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,4,power_law_1.2,0.1687999963760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,balanced,0.2764586607615153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,4,power_law_1.2,1.4800064086914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,4,power_law_1.2,0.1804352045059204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,balanced,0.27503466606140137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,4,power_law_1.2,1.9565887451171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,balanced,0.28128000100453693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,4,power_law_1.2,0.19016319513320923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,balanced,0.2918293277422587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,4,power_law_1.2,0.20636799335479736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,4,power_law_1.2,2.4964927673339843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,balanced,0.29607999324798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,4,power_law_1.2,0.22145919799804686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,4,power_law_1.2,3.877977752685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,balanced,0.30953067541122437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,4,power_law_1.2,0.241593599319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,4,power_law_1.2,0.26742401123046877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,balanced,0.34355199337005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,4,power_law_1.2,7.791142272949219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,4,power_law_1.2,0.349945592880249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,balanced,0.37282665570576984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,balanced,0.4405920108159383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,4,power_law_1.2,0.41887359619140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,balanced,0.5322666565577189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,balanced,0.6585013469060262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,4,power_law_1.2,0.49800958633422854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,4,power_law_1.2,0.6091392040252686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,balanced,0.8327039877573649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,4,power_law_1.2,0.8918656349182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,4,power_law_1.2,1.0718527793884278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,balanced,0.05309333403905233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,4,power_law_1.2,1.561619186401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,balanced,0.0562666654586792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,balanced,1.172917366027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,balanced,0.06691200037797292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,4,power_law_1.2,1.9671167373657226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,balanced,0.08295466502507527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,balanced,0.11573333541552226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,4,power_law_1.2,2.9859392166137697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,balanced,0.1668213407198588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,balanced,0.225055992603302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,4,power_law_1.2,3.836492919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,balanced,0.2283733288447062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,balanced,1.5146613121032715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,balanced,0.23041067520777384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,4,power_law_1.2,4.822489547729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,balanced,0.23197867472966513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,balanced,0.2342346707979838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,4,power_law_1.2,7.859123229980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,balanced,0.23907200495402017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.01,0.05806080102920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,balanced,0.2411253253618876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,balanced,0.24445333083470663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.01,0.0800704002380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,4,power_law_1.2,14.335693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,balanced,0.2556533416112264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,balanced,2.1122132937113443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.01,0.09012479782104492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,balanced,0.26690133412679035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.01,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,balanced,0.28032533327738446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,balanced,0.30921600262324017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.01,0.11032320261001587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,balanced,0.350597341855367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.01,0.14052480459213257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,balanced,0.41980799039204914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.01,0.15612800121307374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.01,0.0537663996219635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.01,0.18443520069122316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,balanced,0.4899253447850545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,balanced,2.5632373491923013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.01,0.05811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.01,0.19249919652938843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,balanced,0.6103093226750692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.01,0.07502719759941101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.01,0.19953919649124147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.01,0.07301759719848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.01,0.2119999885559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,balanced,0.7848640282948812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.01,0.0961023986339569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.01,0.2241663932800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.01,0.12306560277938842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.01,0.22957439422607423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.01,0.13649280071258546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.01,0.24213759899139403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,balanced,1.1003306706746419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.01,0.26774399280548095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.01,0.16711039543151857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,balanced,3.1859893798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.01,0.2724031925201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.01,0.16993919610977173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.01,0.2989952087402344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.01,0.17375999689102173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,balanced,1.433824062347412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.01,0.19040000438690186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.01,0.3473536014556885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.01,0.1969215989112854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.01,0.38134400844573973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.01,0.20792319774627685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.01,0.22518401145935057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.01,0.5043263912200928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.01,0.2460223913192749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.01,0.5267199993133544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,balanced,2.088010629018148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.01,0.2590912103652954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.01,0.6920767784118652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.01,0.2699903964996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.01,0.8559616088867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.01,0.31171839237213134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.01,1.156383991241455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.01,0.3660991907119751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.01,1.5461888313293457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.01,0.4623424053192139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,balanced,4.791194597880046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.01,2.2130752563476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.01,0.4978816032409668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,balanced,2.598917325337728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.01,0.6361792087554932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.01,2.6596351623535157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.01,0.7993919849395752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.01,3.2724414825439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.01,1.0910528182983399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.01,4.917734527587891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.01,1.3899904251098634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.01,2.087295913696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.01,2.68603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.01,10.650931549072265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.01,3.2875648498535157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,balanced,3.234842618306478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.01,5.195251083374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.01,11.129747009277343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,balanced,5.062927881876628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,balanced,10.026506423950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,2,power_law_1.2,0.05774719715118408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,2,power_law_1.2,0.07991679906845092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,2,power_law_1.2,0.07541760206222534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,2,power_law_1.2,0.08540800213813782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,2,power_law_1.2,0.10815999507904053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,2,power_law_1.2,0.12884479761123657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,2,power_law_1.2,0.1469696044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,2,power_law_1.2,0.1816256046295166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,2,power_law_1.2,0.18627840280532837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,2,power_law_1.2,0.19610879421234131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,2,power_law_1.2,0.054041600227355956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,2,power_law_1.2,0.2116544008255005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,2,power_law_1.2,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,2,power_law_1.2,0.21918718814849852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,2,power_law_1.2,0.07037439942359924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,2,power_law_1.2,0.22385919094085693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,2,power_law_1.2,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,2,power_law_1.2,0.24371840953826904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,2,power_law_1.2,0.262009596824646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,2,power_law_1.2,0.08960639834403991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,2,power_law_1.2,0.27307519912719724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,2,power_law_1.2,0.11547520160675048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,2,power_law_1.2,0.29612159729003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,2,power_law_1.2,0.12791039943695068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,2,power_law_1.2,0.36124799251556394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,2,power_law_1.2,0.1625663995742798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,balanced,9.934736251831055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,2,power_law_1.2,0.40560002326965333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,2,power_law_1.2,0.16535680294036864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,2,power_law_1.2,0.5176000118255615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,2,power_law_1.2,0.1750656008720398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,2,power_law_1.2,0.5900800228118896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,2,power_law_1.2,0.183078396320343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,2,power_law_1.2,0.7580416202545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,2,power_law_1.2,0.20084478855133056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,2,power_law_1.2,0.9631808280944825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,2,power_law_1.2,0.19579520225524902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,2,power_law_1.2,1.2435263633728026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,2,power_law_1.2,0.22792320251464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,2,power_law_1.2,0.2427903890609741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,2,power_law_1.2,1.5824128150939942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,2,power_law_1.2,0.2617727994918823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,2,power_law_1.2,2.177881622314453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,2,power_law_1.2,0.27148799896240233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,2,power_law_1.2,2.751379203796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,2,power_law_1.2,0.3244352102279663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,2,power_law_1.2,3.228947067260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,2,power_law_1.2,0.37004799842834474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,2,power_law_1.2,0.46811518669128416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,2,power_law_1.2,5.359769439697265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,2,power_law_1.2,0.5084991931915284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,2,power_law_1.2,0.6868735790252686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,2,power_law_1.2,11.043270111083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,2,power_law_1.2,0.8415679931640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,2,power_law_1.2,1.142188835144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,2,power_law_1.2,1.4728320121765137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,2,power_law_1.2,2.1268032073974608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,2,power_law_1.2,2.739129638671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,2,power_law_1.2,3.720703887939453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,balanced,0.056464001536369324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,2,power_law_1.2,5.554751968383789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,power_law_1.01,0.07000319957733155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,balanced,0.05780800183614095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,balanced,0.054458667834599815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,2,power_law_1.2,11.328447723388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,power_law_1.01,0.06030719876289368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,balanced,0.06014933188756307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,power_law_1.01,0.057599997520446776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,balanced,0.08006399869918823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,power_law_1.01,0.05379840135574341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,64,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,balanced,0.09199999769528706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,power_law_1.01,0.061247998476028444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,balanced,0.09052800138791402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,64,power_law_1.2,0.05971199870109558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,power_law_1.01,0.07077760100364686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,balanced,0.10015466809272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,64,power_law_1.2,0.057817602157592775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,power_law_1.01,0.08403840065002441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,balanced,0.0995360016822815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,64,power_law_1.2,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,power_law_1.01,0.07834879755973816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,balanced,0.09802132844924927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,64,power_law_1.2,0.061504000425338747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,power_law_1.01,0.09176959991455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,balanced,0.0937653382619222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,64,power_law_1.2,0.06934400200843811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,power_law_1.01,0.08889600038528442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,balanced,0.10017599662144978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,64,power_law_1.2,0.0834176003932953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,balanced,0.09663466612497966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,power_law_1.01,0.09088000059127807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,balanced,0.04821866750717163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,64,power_law_1.2,0.0802944004535675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,balanced,0.09510933359464009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,power_law_1.01,0.08983680009841918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,balanced,0.049125333627065025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,64,power_law_1.2,0.09653120040893555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,balanced,0.048895999789237976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,power_law_1.01,0.09225599765777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,balanced,0.09833600123723348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,64,power_law_1.2,0.0953279972076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,balanced,0.04726399978001913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,power_law_1.01,0.08992639780044556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,balanced,0.052202666799227394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,64,power_law_1.2,0.08865280151367187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,balanced,0.09678933024406433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,power_law_1.01,0.08963840007781983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,balanced,0.05858666698137919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,64,power_law_1.2,0.09143679738044738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,balanced,0.06459733347098033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,balanced,0.09797333677609761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,power_law_1.01,0.09007999897003174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,balanced,0.06784533460934956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,64,power_law_1.2,0.09041919708251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,balanced,0.10135466853777568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,power_law_1.01,0.09304959774017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,balanced,0.0792906681696574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,64,power_law_1.2,0.09287040233612061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,balanced,0.08003200093905131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,power_law_1.01,0.11008000373840332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,balanced,0.1072746713956197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,balanced,0.08337066570917766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,64,power_law_1.2,0.0958400011062622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,power_law_1.01,0.1220736026763916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,balanced,0.0765119989713033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,64,power_law_1.2,0.09797760248184204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,balanced,0.1167093316713969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,balanced,0.08060800035794576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,power_law_1.01,0.13415679931640626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,64,power_law_1.2,0.1147968053817749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,balanced,0.0814933329820633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,power_law_1.01,0.18659199476242067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,balanced,0.13665067156155905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,64,power_law_1.2,0.12264319658279418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,balanced,0.07886933286984761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,power_law_1.01,0.23392000198364257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,64,power_law_1.2,0.124236798286438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,balanced,0.08021333316961925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,balanced,0.1581546664237976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,balanced,0.07970133423805237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,64,power_law_1.2,0.18344320058822633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,power_law_1.01,0.28022398948669436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,balanced,0.08157866696516673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,64,power_law_1.2,0.20835840702056885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,power_law_1.01,0.46613759994506837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,balanced,0.08474666873613994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,balanced,0.2189120054244995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,64,power_law_1.2,0.29402239322662355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,power_law_1.01,0.5493887901306153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,balanced,0.0916426678498586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,64,power_law_1.2,0.3880000114440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,power_law_1.01,0.8286399841308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,64,power_law_1.2,0.6345471858978271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,balanced,0.0993226667245229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,power_law_1.01,1.0822015762329102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,balanced,0.26152000824610394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,64,power_law_1.2,0.7820799827575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,power_law_1.01,1.3582528114318848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,balanced,0.11660800377527873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,power_law_1.2,0.9791999816894531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,power_law_1.01,2.114892768859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,power_law_1.01,0.07146880030632019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,power_law_1.2,1.617919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,balanced,0.13733333349227905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,64,balanced,0.3829600016276042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,power_law_1.2,2.3690624237060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,power_law_1.01,4.102348709106446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,power_law_1.01,0.06154879927635193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,balanced,0.21198399861653647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,power_law_1.01,0.05232639908790589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,power_law_1.2,3.310579299926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,power_law_1.01,0.049747198820114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,64,balanced,0.4965759913126628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,balanced,0.2515146732330322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,power_law_1.2,8.700940704345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,power_law_1.01,0.05146239995956421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,power_law_1.01,0.05615360140800476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,power_law_1.01,0.06361600160598754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,balanced,0.36346666018168133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,power_law_1.01,0.06572800278663635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,64,balanced,0.6135093371073405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,power_law_1.01,0.08167679905891419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,power_law_1.01,0.08273280262947083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,balanced,0.4723786513010661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,power_law_1.01,0.08169599771499633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,power_law_1.01,0.08684160113334656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,power_law_1.01,0.07875840067863464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,power_law_1.01,0.08112000226974488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,64,balanced,0.9655840396881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,balanced,0.5843679904937744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,power_law_1.01,0.08116480112075805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,power_law_1.01,0.08173440098762512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,power_law_1.01,0.0862272024154663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,power_law_1.01,0.08184959888458251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,power_law_1.01,0.10991359949111938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,32,power_law_1.2,0.07131519913673401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,power_law_1.01,0.1342911958694458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,power_law_1.01,0.14792319536209106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,32,power_law_1.2,0.05909759998321533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,32,power_law_1.2,0.049472001194953916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,power_law_1.01,0.18802560567855836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,balanced,0.9192266464233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,32,power_law_1.2,0.04936319887638092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,power_law_1.01,0.25045759677886964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,32,power_law_1.2,0.05111039876937866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,power_law_1.01,0.31607680320739745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,32,power_law_1.2,0.055641597509384154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,power_law_1.01,0.4626495838165283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,32,power_law_1.2,0.06428800225257873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,32,power_law_1.2,0.06505600214004517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,power_law_1.01,0.649286413192749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,32,power_law_1.2,0.07906559705734253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,power_law_1.01,0.8585087776184082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,32,power_law_1.2,0.08321279883384705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,balanced,0.03386666625738144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,32,power_law_1.2,0.08136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,power_law_1.01,0.9807616233825683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,64,balanced,1.9009653727213542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,32,power_law_1.2,0.08227840065956116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,balanced,0.035877334574858345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,32,power_law_1.2,0.08184319734573364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,power_law_1.01,1.6653247833251954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,balanced,0.03594133257865906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,32,power_law_1.2,0.0832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,power_law_1.01,3.463257598876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,32,power_law_1.2,0.0818880021572113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,balanced,0.040607998768488564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,power_law_1.01,0.035641598701477054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,32,power_law_1.2,0.08787199854850769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,balanced,0.04312000175317129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,32,power_law_1.2,0.08721920251846313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,balanced,0.04394133388996124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,power_law_1.01,0.04319359958171844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,32,power_law_1.2,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,balanced,0.04903466502825419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,power_law_1.01,0.03749760091304779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,32,power_law_1.2,0.127839994430542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,balanced,1.8011306126912434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,32,power_law_1.2,0.14985599517822265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,balanced,0.047872001926104225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,power_law_1.01,0.04193280041217804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,balanced,0.061146666606267296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,32,power_law_1.2,0.16681599617004395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,power_law_1.01,0.0427264004945755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,32,power_law_1.2,0.23578240871429443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,balanced,0.056613331039746605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,power_law_1.01,0.04185599982738495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,balanced,0.05729066828886668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,power_law_1.01,0.04684799909591675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,32,power_law_1.2,0.27502079010009767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,balanced,0.0876639982064565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,power_law_1.01,0.04622080028057098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,32,power_law_1.2,0.4134079933166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,balanced,0.08247999846935272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,power_law_1.01,0.06023039817810059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,32,power_law_1.2,0.560972785949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,balanced,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,32,power_law_1.2,0.8468799591064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,power_law_1.01,0.059487998485565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,balanced,0.07900266846021016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,32,power_law_1.2,0.9977279663085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,power_law_1.01,0.05689600110054016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,balanced,0.08091199894746144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,power_law_1.01,0.08810240030288696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,32,power_law_1.2,1.4397312164306642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,balanced,0.08097599943478902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,power_law_1.01,0.085343998670578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,32,power_law_1.2,2.1182207107543944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,power_law_1.01,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,balanced,0.0841439962387085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,32,power_law_1.2,5.183878326416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,power_law_1.01,0.0843392014503479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,balanced,0.08711999654769897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,power_law_1.01,0.08498560190200806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,balanced,0.09478400150934856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,power_law_1.01,0.08655359745025634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,power_law_1.01,0.09256319999694824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,balanced,0.10216533144315083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,power_law_1.01,0.09660159945487976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,balanced,0.11911466717720032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,power_law_1.01,0.11449600458145141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,power_law_1.01,0.1418239951133728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,balanced,0.13730133573214212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,power_law_1.01,0.1709247946739197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,balanced,0.21331733465194702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,power_law_1.01,0.1875391960144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,power_law_1.01,0.2927615880966187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,power_law_1.01,0.3431616067886353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,balanced,0.2478613257408142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,power_law_1.01,0.5693823814392089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,power_law_1.01,0.7068543910980225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,power_law_1.01,0.8525504112243653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,balanced,0.35755733648935956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,power_law_1.01,1.2731007575988769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,16,power_law_1.2,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,power_law_1.01,2.6215295791625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,16,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,16,power_law_1.2,0.03824000060558319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,balanced,0.4636960029602051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,16,power_law_1.2,0.04225279986858368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,16,power_law_1.2,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,balanced,0.03051200012365977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,16,power_law_1.2,0.042412799596786496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,balanced,0.03317866722742716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,16,power_law_1.2,0.04737280011177063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,balanced,0.5730613470077515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,balanced,0.033743999898433685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,16,power_law_1.2,0.04642559885978699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,balanced,0.03682133307059606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,16,power_law_1.2,0.06112639904022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,balanced,0.04219200213750204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,16,power_law_1.2,0.05818880200386047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,balanced,0.0467199981212616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,16,power_law_1.2,0.05801600217819214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,balanced,0.045941332976023354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,16,power_law_1.2,0.08713600039482117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,balanced,0.04637333254019419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,16,power_law_1.2,0.08403840065002441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,balanced,0.05118933320045471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,balanced,0.8988693555196127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,16,power_law_1.2,0.0887615978717804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,balanced,0.04822933177153269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,16,power_law_1.2,0.08458880186080933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,16,power_law_1.2,0.0918079972267151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,balanced,0.04971200227737427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,16,power_law_1.2,0.09184640049934387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,balanced,0.06198933223883311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,16,power_law_1.2,0.09644799828529357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,balanced,0.05917333563168844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,16,power_law_1.2,0.10417920351028442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,balanced,0.05900266766548157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,16,power_law_1.2,0.13678719997406005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,balanced,0.08763200044631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,16,power_law_1.2,0.1426367998123169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,balanced,0.08226133386294048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,16,power_law_1.2,0.1932927966117859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,balanced,0.08125866452852885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,16,power_law_1.2,0.2248768091201782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,16,power_law_1.2,0.31340799331665037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,balanced,0.08664000034332275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,16,power_law_1.2,0.45175681114196775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,balanced,0.08946133653322856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,balanced,1.7615893681844075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,16,power_law_1.2,0.6181183815002441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,power_law_1.01,0.03111039996147156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,balanced,0.09771200021107991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,16,power_law_1.2,0.7908607959747315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,power_law_1.01,0.03497599959373474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,balanced,0.10690133770306905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,16,power_law_1.2,1.0651519775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,power_law_1.01,0.03440000116825104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,balanced,0.12517333030700684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,16,power_law_1.2,1.6101247787475585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,power_law_1.01,0.03696640133857727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,16,power_law_1.2,3.3505664825439454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,balanced,0.1449066698551178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,power_law_1.01,0.04487679898738861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,balanced,0.028165332973003387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,balanced,0.22499734163284302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,power_law_1.01,0.04425599873065948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,8,power_law_1.2,0.031200000643730165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,balanced,0.02997333308060964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,power_law_1.01,0.04591360092163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,8,power_law_1.2,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,balanced,0.03169599920511246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,balanced,0.26129066944122314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,power_law_1.01,0.05060480237007141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,8,power_law_1.2,0.03208959996700287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,balanced,0.035274667044480644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,8,power_law_1.2,0.0366784006357193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,power_law_1.01,0.04816640019416809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,balanced,0.04166933397452036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,8,power_law_1.2,0.03896960020065308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,power_law_1.01,0.04958719909191132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,balanced,0.052069331208864846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,8,power_law_1.2,0.04499199986457825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,balanced,0.3756106694539388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,balanced,0.051776001850763954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,power_law_1.01,0.0599232017993927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,8,power_law_1.2,0.04431360065937042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,balanced,0.05194133520126343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,8,power_law_1.2,0.04470399916172028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,power_law_1.01,0.059935998916625974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,balanced,0.051125332713127136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,8,power_law_1.2,0.05043839812278748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,power_law_1.01,0.058534401655197146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,balanced,0.05116266508897146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,8,power_law_1.2,0.04843519926071167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,power_law_1.01,0.08811519742012024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,balanced,0.051962668697039284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,8,power_law_1.2,0.04987519979476929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,balanced,0.47677866617838544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,balanced,0.05415999889373779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,8,power_law_1.2,0.060838401317596436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,power_law_1.01,0.085343998670578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,8,power_law_1.2,0.058899199962615965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,power_law_1.01,0.08485760092735291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,power_law_1.01,0.028812798857688903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,balanced,0.05515199899673462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,8,power_law_1.2,0.061292797327041626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,power_law_1.01,0.09374079704284669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,balanced,0.06364800035953522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,power_law_1.01,0.03294720053672791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,8,power_law_1.2,0.0895359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,power_law_1.01,0.09926400184631348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,balanced,0.06533333162466685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,balanced,0.5903199911117554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,8,power_law_1.2,0.08674560189247131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,power_law_1.01,0.03056640028953552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,power_law_1.01,0.11729279756546021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,balanced,0.06639466683069865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,8,power_law_1.2,0.0859391987323761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,power_law_1.01,0.03687680065631867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,power_law_1.01,0.12616319656372071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,balanced,0.09947199622790019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,8,power_law_1.2,0.09262080192565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,power_law_1.01,0.04301440119743347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,balanced,0.10317333539326985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,power_law_1.01,0.16906880140304564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,8,power_law_1.2,0.10179200172424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,power_law_1.01,0.04366720020771027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,power_law_1.01,0.20135040283203126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,8,power_law_1.2,0.13151999711990356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,balanced,0.11217066645622253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,power_law_1.01,0.049158400297164916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,power_law_1.01,0.27111039161682127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,8,power_law_1.2,0.14449280500411987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,power_law_1.01,0.04828799962997436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,balanced,0.12172800302505493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,power_law_1.01,0.33378560543060304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,8,power_law_1.2,0.177401602268219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,power_law_1.01,0.048403200507164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,balanced,0.9223466714223226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,power_law_1.01,0.4760767936706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,balanced,0.14147200187047324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,8,power_law_1.2,0.22279040813446044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,power_law_1.01,0.04801279902458191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,power_law_1.01,0.6157760143280029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,power_law_1.01,0.04912639856338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,8,power_law_1.2,0.28910720348358154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,balanced,0.16343999902407327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,power_law_1.01,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,power_law_1.01,0.7455296039581298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,8,power_law_1.2,0.35627520084381104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,power_law_1.01,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,power_law_1.01,1.1473983764648437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,8,power_law_1.2,0.5547455787658692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,balanced,0.25830399990081787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,power_law_1.01,0.0555840015411377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,4,power_law_1.2,0.028678399324417115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,8,power_law_1.2,0.6358208179473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,power_law_1.01,2.4505983352661134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,power_law_1.01,0.06420480012893677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,4,power_law_1.2,0.03272959887981415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,8,power_law_1.2,0.9327487945556641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,balanced,0.2983466585477193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,power_law_1.01,0.06465920209884643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,4,power_law_1.2,0.031462401151657104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,8,power_law_1.2,1.4447744369506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,power_law_1.01,0.0738752007484436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,4,power_law_1.2,0.03646079897880554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,power_law_1.2,3.230803298950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,power_law_1.01,0.09979519844055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,4,power_law_1.2,0.04229120016098022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,balanced,0.4338080088297526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,power_law_1.01,0.11954560279846191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,4,power_law_1.2,0.04232960045337677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,power_law_1.01,0.14027520418167114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,4,power_law_1.2,0.04775680005550385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,power_law_1.01,0.1551743984222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,8,balanced,1.8033706347147624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,4,power_law_1.2,0.04875519871711731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,power_law_1.01,0.19800959825515746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,balanced,0.5662399927775065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,4,power_law_1.2,0.04839679896831513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,power_law_1.01,0.2223871946334839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,4,power_law_1.2,0.048921599984169006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,power_law_1.01,0.31191039085388184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,4,power_law_1.2,0.04963839948177338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,power_law_1.01,0.39473280906677244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,4,power_law_1.2,0.05422719717025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,4,power_law_1.2,0.05369600057601929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,power_law_1.01,0.5356863975524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,balanced,0.6999200185139974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,4,power_law_1.2,0.05780479907989502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,power_law_1.01,0.6853759765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,4,power_law_1.2,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,power_law_1.01,0.8629631996154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,4,power_law_1.2,0.07162240147590637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,power_law_1.01,1.26692476272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,4,power_law_1.2,0.07367680072784424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,4,power_law_1.2,0.12100479602813721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,power_law_1.01,2.5714176177978514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,4,power_law_1.2,0.12345600128173828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,balanced,1.0958507061004639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,4,power_law_1.2,0.1480831980705261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,4,power_law_1.2,0.1628543972969055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,4,power_law_1.2,0.20712320804595946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,4,power_law_1.2,0.2563776016235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,4,power_law_1.2,0.3222399950027466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,4,power_law_1.2,0.4348735809326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,balanced,0.027610667049884796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,4,power_law_1.2,0.5723584175109864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,balanced,0.029552000264326733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,4,power_law_1.2,0.7720255851745605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,balanced,0.030389333764712017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,4,power_law_1.2,0.9682944297790528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,balanced,0.03468266626199087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,balanced,0.04264533519744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,4,power_law_1.2,1.4600064277648925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,power_law_1.2,2.7908416748046876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,4,balanced,2.1460426648457847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,balanced,0.05588266750176748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,balanced,0.05781333148479462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,power_law_1.01,0.027673599123954774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,balanced,0.05563200016816457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,power_law_1.01,0.029676800966262816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,power_law_1.01,0.02956160008907318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,balanced,0.05535466472307841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,power_law_1.01,0.035596799850463864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,balanced,0.05417066812515259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,power_law_1.01,0.041817599534988405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,balanced,0.05489600201447805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,balanced,0.055071999629338585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,power_law_1.01,0.04457600116729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,balanced,0.05578133463859558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,power_law_1.01,0.0491456001996994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,balanced,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,power_law_1.01,0.050783997774124144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,balanced,0.06117333471775055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,power_law_1.01,0.05196800231933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,balanced,0.06344000001748402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,power_law_1.01,0.05237119793891907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,balanced,0.0654720018307368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,power_law_1.01,0.05243520140647888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,balanced,0.08108800152937572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,power_law_1.01,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,balanced,0.08493866523106892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,power_law_1.01,0.053376001119613645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,balanced,0.13014933466911316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,power_law_1.01,0.06064000129699707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,power_law_1.01,0.060185599327087405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,balanced,0.14148267110188803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,power_law_1.01,0.06761599779129028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,balanced,0.16647467017173767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,power_law_1.01,0.07247359752655029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,power_law_1.01,0.08981119990348815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,balanced,0.1919893423716227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,power_law_1.01,0.09504640102386475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,power_law_1.01,0.15858559608459472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,balanced,0.30822400252024335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,power_law_1.01,0.18009599447250366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,power_law_1.01,0.21856000423431396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,balanced,0.3580160140991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,power_law_1.01,0.2579456090927124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,power_law_1.01,0.35401599407196044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,power_law_1.01,0.42836480140686034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,balanced,0.520799994468689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,power_law_1.01,0.625113582611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,2,power_law_1.2,0.027718400955200194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,power_law_1.01,0.7748032093048096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,2,power_law_1.2,0.0297791987657547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,power_law_1.01,0.9446463584899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,2,power_law_1.2,0.028857600688934327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,power_law_1.01,1.4203712463378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,2,power_law_1.2,0.03439359962940216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,balanced,0.6772533257802328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,2,power_law_1.2,0.038150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,power_law_1.01,2.8536447525024413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,2,power_law_1.2,0.04490239918231964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,balanced,0.042709335684776306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,2,power_law_1.2,0.048416000604629514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,2,power_law_1.2,0.05066239833831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,balanced,0.8367146650950114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,balanced,0.04412800073623657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,2,power_law_1.2,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,power_law_1.01,0.04258559942245484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,2,power_law_1.2,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,balanced,0.04407466451327006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,power_law_1.01,0.04284160137176514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,2,power_law_1.2,0.051737600564956666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,2,power_law_1.2,0.05459200143814087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,2,power_law_1.2,0.05866879820823669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,balanced,0.04951466619968414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,power_law_1.01,0.046105599403381346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,balanced,1.3045706748962402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,2,power_law_1.2,0.06165120005607605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,2,power_law_1.2,0.06093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,2,power_law_1.2,0.06883199810981751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,2,32,power_law_1.2,0.041356799006462094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,2,power_law_1.2,0.07254400253295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,balanced,0.05169066786766052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,2,32,power_law_1.2,0.042105600237846375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,power_law_1.01,0.04917120039463043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,2,power_law_1.2,0.09005439877510071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,2,32,power_law_1.2,0.04251520037651062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,2,power_law_1.2,0.09664639830589294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,2,32,power_law_1.2,0.046393600106239316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,2,power_law_1.2,0.16509439945220947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,2,32,power_law_1.2,0.04895359873771667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,2,power_law_1.2,0.18391040563583375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,2,power_law_1.2,0.2199104070663452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,2,power_law_1.2,0.2762432098388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,2,power_law_1.2,0.34780800342559814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,balanced,0.05741333464781443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,power_law_1.01,0.05573760271072388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,2,power_law_1.2,0.4390719890594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,2,power_law_1.2,0.6195968151092529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,2,32,power_law_1.2,0.05541759729385376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,balanced,2.533402601877848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,2,power_law_1.2,0.8301759719848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,balanced,0.05843733251094818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,2,power_law_1.2,0.931827163696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,power_law_1.01,0.05820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,power_law_1.01,0.05675519704818725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,balanced,0.05807466804981232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,2,power_law_1.2,1.583795166015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,power_law_1.01,0.06646400094032287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,2,32,power_law_1.2,0.05608959794044495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,balanced,0.0671253353357315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,power_law_1.01,0.06605439782142639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,2,power_law_1.2,2.7936511993408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,2,32,power_law_1.2,0.05628160238265991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,power_law_1.01,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,balanced,0.06720533470312755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,balanced,0.03198933353026708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,power_law_1.01,0.03240959942340851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,2,32,power_law_1.2,0.06601600050926208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,power_law_1.01,0.0662335991859436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,balanced,0.06764266888300578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,balanced,0.03294399877389272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,power_law_1.01,0.06718080043792725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,2,32,power_law_1.2,0.06605439782142639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,power_law_1.01,0.03331199884414673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,balanced,0.06693333387374878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,power_law_1.01,0.06811519861221313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,2,32,power_law_1.2,0.0659775972366333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,balanced,0.06783999999364217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,balanced,0.03325333446264267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,power_law_1.01,0.06873599886894226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,2,32,power_law_1.2,0.06590080261230469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,power_law_1.01,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,balanced,0.06858133276303609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,balanced,0.036901332437992096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,power_law_1.01,0.06990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,2,32,power_law_1.2,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,power_law_1.01,0.0366784006357193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,power_law_1.01,0.07369599938392639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,2,32,power_law_1.2,0.06792320013046264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,balanced,0.0690773328145345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,power_law_1.01,0.10396800041198731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,2,32,power_law_1.2,0.06922879815101624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,2,32,power_law_1.2,0.0706496000289917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,power_law_1.01,0.10549119710922242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,balanced,0.07102400064468384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,balanced,0.040287998815377556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,2,32,power_law_1.2,0.07329919934272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,power_law_1.01,0.13426560163497925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,power_law_1.01,0.03919999897480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,balanced,0.07446399827798207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,2,32,power_law_1.2,0.11957119703292847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,power_law_1.01,0.16010240316390992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,power_law_1.2,0.10576000213623046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,power_law_1.01,0.2544895887374878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,2,32,balanced,0.07639466722806294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,power_law_1.2,0.16792320013046264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,power_law_1.01,0.32069759368896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,2,32,balanced,0.08507200082143147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,power_law_1.2,0.1872063994407654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,power_law_1.01,0.4705984115600586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,balanced,0.04230933388074239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,2,32,balanced,0.09513599673906963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,power_law_1.01,0.04190079867839813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,power_law_1.2,0.2786240100860596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,power_law_1.01,0.6269567966461181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,power_law_1.2,0.3571968078613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,2,32,balanced,0.10988266269365947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,power_law_1.01,0.9128704071044922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,power_law_1.2,0.5277696132659913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,power_law_1.01,1.2547712326049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,balanced,0.05115200082461039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,2,32,balanced,0.13326932986577353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,power_law_1.2,0.6590208053588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,power_law_1.01,1.6614912033081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,balanced,0.05018133421738943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,power_law_1.01,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,power_law_1.2,1.0243519783020019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,power_law_1.01,2.494047927856445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,power_law_1.01,0.04899199903011322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,2,32,balanced,0.19840532541275024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,power_law_1.2,1.355180835723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,power_law_1.01,4.986252975463867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,power_law_1.2,1.6881919860839845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,power_law_1.2,2.6798015594482423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,2,32,balanced,0.2458720008532206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,balanced,0.049882665276527405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,balanced,0.05016533533732096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,power_law_1.01,0.050387197732925416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,power_law_1.2,5.362444686889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,balanced,0.05227733155091604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,power_law_1.01,0.05159040093421936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,balanced,0.052154665191968284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,power_law_1.01,0.051648002862930295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,2,32,balanced,0.35574932893117267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,balanced,0.05889600018660227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,power_law_1.01,0.05270400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,balanced,0.05886933207511902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,power_law_1.01,0.058534401655197146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,balanced,0.059024001161257424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,power_law_1.01,0.060140800476074216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,balanced,0.05978133281071981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,power_law_1.01,0.0599232017993927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,2,32,balanced,0.4636213382085164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,power_law_1.01,0.060652798414230345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,balanced,0.06048533320426941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,balanced,0.06435200075308482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,power_law_1.01,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,power_law_1.01,0.07749760150909424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,balanced,0.06620799998442332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,power_law_1.01,0.0834176003932953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,balanced,0.07684800028800964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,2,32,balanced,0.5740906794865926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,power_law_1.01,0.1198848009109497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,16,power_law_1.2,0.03227519989013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,balanced,0.08701333403587341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,power_law_1.01,0.14953600168228148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,16,power_law_1.2,0.032595199346542356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,power_law_1.01,0.197324800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,balanced,0.1142080028851827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,16,power_law_1.2,0.032671999931335446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,power_law_1.01,0.24126720428466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,16,power_law_1.2,0.03653120100498199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,balanced,0.13322133819262186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,power_law_1.01,0.3570240020751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,16,power_law_1.2,0.03924480080604553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,power_law_1.01,0.4922175884246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,16,power_law_1.2,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,balanced,0.1987946629524231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,2,32,balanced,0.9021813074747721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,16,power_law_1.2,0.05127040147781372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,power_law_1.01,0.8051456451416016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,power_law_1.01,1.0250816345214844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,balanced,0.24068800608317056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,16,power_law_1.2,0.0497408002614975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,power_law_1.01,1.2136768341064452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,16,power_law_1.2,0.04990079998970032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,power_law_1.01,1.8229440689086913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,16,power_law_1.2,0.05206400156021118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,balanced,0.34907201925913495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,power_law_1.01,3.6059711456298826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,16,power_law_1.2,0.05367040038108826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,16,power_law_1.2,0.054022401571273804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,balanced,0.4529333511988322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,16,power_law_1.2,0.059436798095703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,16,power_law_1.2,0.05987840294837952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,16,power_law_1.2,0.06000000238418579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,16,power_law_1.2,0.06455680131912231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,16,power_law_1.2,0.06323840022087097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,2,32,balanced,1.7838026682535808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,16,power_law_1.2,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,balanced,0.5622080167134603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,16,power_law_1.2,0.08606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,16,power_law_1.2,0.13029760122299194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,balanced,0.02924266705910365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,16,power_law_1.2,0.15354880094528198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,balanced,0.029834667841593426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,16,power_law_1.2,0.24092159271240235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,balanced,0.0305173322558403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,16,power_law_1.2,0.3257472038269043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,16,power_law_1.2,0.4538623809814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,balanced,0.03462400039037069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,16,power_law_1.2,0.6304831981658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,16,power_law_1.2,1.0436991691589355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,balanced,0.8814613024393717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,balanced,0.03666666646798452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,16,power_law_1.2,1.3839424133300782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,16,power_law_1.2,1.5772607803344727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,balanced,0.03812266637881597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,16,power_law_1.2,2.3628416061401367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,power_law_1.2,5.406355285644532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,power_law_1.01,0.029209598898887634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,balanced,0.04115733255942663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,power_law_1.01,0.030086401104927062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,balanced,0.041536000867684685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,power_law_1.01,0.02993920147418976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,power_law_1.01,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,balanced,0.045007998744646706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,power_law_1.01,0.038124799728393555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,balanced,0.04576533536116282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,power_law_1.01,0.04156160056591034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,balanced,0.046384001771608986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,16,balanced,1.735914707183838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,power_law_1.01,0.04200960099697113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,power_law_1.01,0.04524799883365631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,power_law_1.01,0.04544639885425568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,balanced,0.046112000942230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,power_law_1.01,0.04835839867591858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,balanced,0.04684266448020935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,power_law_1.01,0.04704639911651611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,balanced,0.04867733518282572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,power_law_1.01,0.0474368005990982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,balanced,0.04962133367856344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,power_law_1.01,0.05167359709739685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,balanced,0.056405335664749146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,power_law_1.01,0.05440639853477478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,balanced,0.05749333401521047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,power_law_1.01,0.06293759942054748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,balanced,0.060736000537872314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,balanced,0.027114666998386383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,8,power_law_1.2,0.029625600576400755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,power_law_1.01,0.06455680131912231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,balanced,0.06282133360703786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,balanced,0.02903466671705246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,8,power_law_1.2,0.030067199468612672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,power_law_1.01,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,balanced,0.0817493349313736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,balanced,0.030810666580994923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,8,power_law_1.2,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,power_law_1.01,0.0765504002571106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,balanced,0.03395200024048487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,balanced,0.09089600046475728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,8,power_law_1.2,0.03400320112705231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,power_law_1.01,0.10648959875106812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,balanced,0.034661332766215004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,8,power_law_1.2,0.03553920090198517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,balanced,0.11450133721033733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,power_law_1.01,0.1124608039855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,8,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,balanced,0.033717334270477295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,power_law_1.01,0.16015360355377198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,8,power_law_1.2,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,balanced,0.13845866918563843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,power_law_1.01,0.2070847988128662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,8,power_law_1.2,0.04209280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,balanced,0.03659733384847641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,power_law_1.01,0.29919359683990476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,balanced,0.20639467239379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,8,power_law_1.2,0.04562560021877289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,power_law_1.01,0.4028480052947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,8,power_law_1.2,0.04880639910697937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,balanced,0.03527999917666117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,8,power_law_1.2,0.0469184011220932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,power_law_1.01,0.5703423976898193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,balanced,0.2521333297093709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,8,power_law_1.2,0.04731520116329193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,power_law_1.01,0.7040319919586182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,8,power_law_1.2,0.047443199157714847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,balanced,0.04012266546487808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,power_law_1.01,0.8982912063598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,8,power_law_1.2,0.05070719718933105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,balanced,0.36484265327453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,balanced,0.03993066648642222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,power_law_1.01,1.521491241455078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,8,power_law_1.2,0.05420799851417542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,balanced,0.0384853333234787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,8,power_law_1.2,0.06357120275497437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,power_law_1.01,3.240358352661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,8,power_law_1.2,0.06665599942207337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,power_law_1.01,0.028095999360084535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,balanced,0.4642719825108846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,8,power_law_1.2,0.07538560032844543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,power_law_1.01,0.029683199524879456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,8,power_law_1.2,0.08474239706993103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,balanced,0.05217066903909048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,power_law_1.01,0.02985599935054779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,8,power_law_1.2,0.10804480314254761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,balanced,0.05323199927806854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,power_law_1.01,0.032953599095344545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,8,power_law_1.2,0.14831360578536987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,balanced,0.04804799954096476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,balanced,0.5753920078277588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,8,power_law_1.2,0.1932096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,power_law_1.01,0.033139199018478394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,balanced,0.05027199784914652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,8,power_law_1.2,0.22823679447174072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,power_law_1.01,0.03695360124111176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,balanced,0.05373333394527435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,8,power_law_1.2,0.3399616003036499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,power_law_1.01,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,balanced,0.05574400226275126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,8,power_law_1.2,0.4498176097869873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,power_law_1.01,0.04022400081157684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,balanced,0.06507200002670288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,8,power_law_1.2,0.7283071994781494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,power_law_1.01,0.04035840034484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,balanced,0.07036266724268596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,8,power_law_1.2,1.0554495811462403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,power_law_1.01,0.04087679982185364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,balanced,0.9014933109283447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,power_law_1.01,0.055731201171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,balanced,0.08916266759236653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,8,power_law_1.2,1.347334384918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,power_law_1.01,0.05431680083274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,8,power_law_1.2,2.3324928283691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,balanced,0.09727467099825542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,power_law_1.01,0.05717759728431702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,4,power_law_1.2,0.02789120078086853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,power_law_1.2,3.841849517822266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,power_law_1.01,0.054579198360443115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,balanced,0.12557333707809448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,4,power_law_1.2,0.030355200171470642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,power_law_1.01,0.05799679756164551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,4,power_law_1.2,0.03075839877128601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,balanced,0.15478400389353433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,power_law_1.01,0.06259840130805969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,4,power_law_1.2,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,power_law_1.01,0.07568640112876893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,4,power_law_1.2,0.034329599142074584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,balanced,0.23177067438761392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,power_law_1.01,0.08275840282440186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,balanced,0.02624000112215678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,4,power_law_1.2,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,power_law_1.01,0.09908480048179627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,balanced,0.0281333327293396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,4,power_law_1.2,0.036985599994659425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,balanced,0.02926933268706004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,power_law_1.01,0.1323456048965454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,balanced,0.033520000676314034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,4,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,balanced,0.28866666555404663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,power_law_1.01,0.16660480499267577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,balanced,0.034688000877698265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,4,power_law_1.2,0.040608000755310056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,power_law_1.01,0.20999679565429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,8,balanced,1.7707947095235188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,balanced,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,4,power_law_1.2,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,balanced,0.035173334181308746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,power_law_1.01,0.3344831943511963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,balanced,0.03430933256944021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,4,power_law_1.2,0.041196799278259276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,balanced,0.42045867443084717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,power_law_1.01,0.4308800220489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,4,power_law_1.2,0.05511680245399475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,balanced,0.03692266593376795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,power_law_1.01,0.6636159896850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,4,power_law_1.2,0.055980801582336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,balanced,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,power_law_1.01,0.8260352134704589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,4,power_law_1.2,0.06058239936828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,power_law_1.01,1.0408448219299316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,4,power_law_1.2,0.05634559988975525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,balanced,0.5511519908905029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,balanced,0.03623999903599421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,4,power_law_1.2,0.06208639740943909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,power_law_1.01,1.4087424278259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,4,power_law_1.2,0.06368640065193176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,power_law_1.01,3.0476095199584963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,balanced,0.04238933324813843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,4,power_law_1.2,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,power_law_1.01,0.026726400852203368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,balanced,0.043391997615496315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,4,power_law_1.2,0.0887167990207672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,power_law_1.01,0.027692800760269164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,balanced,0.6813279787699381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,power_law_1.01,0.028224000334739686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,4,power_law_1.2,0.10097919702529908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,balanced,0.040976000328858696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,power_law_1.01,0.031839999556541446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,4,power_law_1.2,0.11614079475402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,power_law_1.01,0.03365119993686676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,4,power_law_1.2,0.21784958839416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,power_law_1.01,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,4,power_law_1.2,0.23519361019134521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,power_law_1.01,0.03480960130691528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,balanced,0.05643199880917867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,4,power_law_1.2,0.3594559907913208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,balanced,0.05746666590372721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,power_law_1.01,0.03553920090198517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,4,power_law_1.2,0.5098112106323243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,balanced,1.0716959635416667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,power_law_1.01,0.037945601344108584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,4,power_law_1.2,0.6219456195831299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,power_law_1.01,0.038438400626182555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,4,power_law_1.2,0.862662410736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,power_law_1.01,0.03966720104217529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,balanced,0.054773335655530296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,power_law_1.01,0.04268800020217896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,4,power_law_1.2,1.1277952194213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,balanced,0.06470400094985962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,power_law_1.01,0.04424319863319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,balanced,0.07297066847483318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,4,power_law_1.2,1.845510482788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,power_law_1.01,0.0456959992647171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,balanced,0.09860799709955852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,power_law_1.01,0.061913597583770755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,power_law_1.2,3.559641647338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,balanced,0.10818666219711304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,power_law_1.01,0.06515840291976929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,balanced,0.14434132973353067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,power_law_1.01,0.06873599886894226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,balanced,0.18067733446756998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,power_law_1.01,0.07660800218582153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,power_law_1.01,0.09276800155639649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,balanced,0.27215999364852905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,power_law_1.01,0.10493439435958862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,4,balanced,2.099850654602051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,power_law_1.01,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,balanced,0.342901349067688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,power_law_1.01,0.16193920373916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,power_law_1.01,0.23177599906921387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,power_law_1.01,0.32083840370178224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,balanced,0.500656008720398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,power_law_1.01,0.4474048137664795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,power_law_1.01,0.5998591899871826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,2,power_law_1.2,0.026495999097824095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,power_law_1.01,0.7497151851654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,2,power_law_1.2,0.02794879972934723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,balanced,0.658735990524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,2,power_law_1.2,0.028217598795890808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,power_law_1.01,1.0367679595947266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,2,power_law_1.2,0.03128319978713989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,2,power_law_1.2,0.033369600772857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,power_law_1.01,1.59617919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,2,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,2,power_law_1.2,0.034860798716545106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,power_law_1.01,3.2669567108154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,2,power_law_1.2,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,2,power_law_1.2,0.03878400027751923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,balanced,0.812666654586792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,2,power_law_1.2,0.039001598954200745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,balanced,0.03656533360481262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,2,power_law_1.2,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,2,power_law_1.2,0.043244799971580504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,balanced,0.031712000568707786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,balanced,0.03233599911133448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,2,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,balanced,0.032586666444937386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,2,power_law_1.2,0.04593279957771301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,balanced,0.03309333324432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,2,power_law_1.2,0.06172159910202026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,balanced,0.03385599950949351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,balanced,0.03551466763019562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,balanced,0.033200000723203026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,balanced,1.2756319840749104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,2,power_law_1.2,0.06403200030326843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,balanced,0.038506666819254555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,balanced,0.03603733330965042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,2,power_law_1.2,0.0689087986946106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,balanced,0.039994666973749794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,balanced,0.03577066709597906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,2,power_law_1.2,0.07554559707641602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,balanced,0.038431999584039055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,balanced,0.037962667644023895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,2,power_law_1.2,0.08831359744071961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,balanced,0.03849066545565923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,balanced,0.0377866675456365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,2,power_law_1.2,0.1040768027305603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,balanced,0.038949333131313324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,balanced,0.038133333126703896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,2,power_law_1.2,0.12499840259552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,balanced,0.0397173340121905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,balanced,0.038848000268141426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,2,power_law_1.2,0.17985279560089112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,balanced,0.03982933362325033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,balanced,0.03825066735347112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,balanced,0.04298666616280874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,2,power_law_1.2,0.22481279373168944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,balanced,0.03881600002447764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,balanced,0.04403733213742574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,2,power_law_1.2,0.33628799915313723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,balanced,0.039264000952243805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,balanced,0.044069334864616394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,balanced,0.03653866549332937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,2,power_law_1.2,0.4963712215423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,balanced,0.036848001182079315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,balanced,0.05093333125114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,2,power_law_1.2,0.6364736080169677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,balanced,0.04012266546487808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,balanced,0.04855999847253164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,2,power_law_1.2,0.8009663581848144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,balanced,0.038047999143600464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,balanced,0.06779733300209045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,balanced,0.04196799794832865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,balanced,2.4920266469319663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,2,power_law_1.2,1.0578368186950684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,balanced,0.06182933350404104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,balanced,0.041589332123597465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,2,power_law_1.2,1.5902463912963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,balanced,0.08595200379689534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,balanced,0.04320000112056732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,balanced,0.05282666782538096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,2,power_law_1.2,3.251724624633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,balanced,0.08538132905960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,balanced,0.05142400165398916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,balanced,0.12961600224177042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,balanced,0.07295999924341838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,balanced,0.0748533308506012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,balanced,0.13829867045084634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,balanced,0.10166933139165242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,balanced,0.026015999416510265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,balanced,0.21570666631062826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,balanced,0.11486400167147319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,balanced,0.025946666797002155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,balanced,0.1613866686820984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,balanced,0.025914666553338368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,balanced,0.18889600038528442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,balanced,0.027930667002995808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,balanced,0.027493332823117573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,balanced,0.02848000079393387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,balanced,0.27781333525975543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,balanced,0.3232373396555583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,balanced,0.028805332879225414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,balanced,0.02869333326816559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,balanced,0.029290666182835896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,balanced,0.33952001730600995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.01,0.031244799494743347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.01,0.031411200761795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,balanced,0.4866933425267537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.01,0.03208320140838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,balanced,0.42893866697947186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.01,0.03238399922847748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,balanced,0.02850666642189026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.01,0.04053759872913361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,balanced,0.029274667302767437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.01,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.01,0.03854719996452331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.01,0.03457280099391937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,balanced,0.02869333326816559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,balanced,0.6522560119628906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.01,0.03953920006752014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.01,0.03475840091705322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.01,0.0416703999042511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,balanced,0.8484586874643961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.01,0.034668800234794614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.01,0.04197759926319122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.01,0.04873600006103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.01,0.037676799297332766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,balanced,0.035605333745479584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.01,0.0506816029548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.01,0.037452799081802365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,balanced,0.035690667728583016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.01,0.05459200143814087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,balanced,0.03571200122435888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.01,0.06257280111312866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,balanced,1.2386079629262288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.01,0.06875519752502442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.01,0.036908799409866334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.01,0.07048320174217224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.01,0.03814400136470795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.01,0.08121600151062011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.01,0.03824000060558319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,power_law_1.01,0.02561280131340027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.01,0.09958400130271912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,balanced,0.04248000184694926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.01,0.0392192006111145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.01,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,balanced,0.043552001317342125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,power_law_1.01,0.0255295991897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.01,0.1442944049835205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.01,0.041631999611854556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.01,0.19765119552612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,power_law_1.01,0.025388801097869874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.01,0.0427264004945755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.01,0.2402496099472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,power_law_1.01,0.027212798595428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.01,0.05422719717025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.01,0.34277119636535647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,power_law_1.01,0.027296000719070436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.01,0.056531202793121335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.01,0.3534656047821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,power_law_1.01,0.028780800104141236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.01,0.06683520078659058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,balanced,0.05541333556175232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.01,0.5468287944793702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,power_law_1.01,0.028435200452804565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.01,0.08320639729499817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,power_law_1.01,0.028940799832344054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.01,0.7306816101074218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.01,0.08755199909210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,power_law_1.01,0.030118399858474733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.01,0.11138559579849243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.01,0.9455807685852051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.01,0.125491201877594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.01,1.5876735687255858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.01,0.15460480451583863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,balanced,0.063360000650088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,power_law_1.01,0.03716480135917664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.01,0.19254399538040162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.01,2.4412288665771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,power_law_1.01,0.03948799967765808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.01,0.28304638862609866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,power_law_1.01,0.042335999011993405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.01,0.3340543985366821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,power_law_1.01,0.04821760058403015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,balanced,0.08140799899895985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.01,0.5046592235565186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.01,0.6552512168884277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.01,0.8130944252014161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,power_law_1.01,0.051520001888275144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.01,1.3993408203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,power_law_1.01,0.055615997314453124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,balanced,0.09866666793823242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,power_law_1.01,0.06767359972000123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.01,2.515020751953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,balanced,0.1372106671333313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,16,8,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,power_law_1.01,0.07964800000190735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,balanced,0.16927999258041382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,16,8,power_law_1.2,0.03198080062866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,16,8,power_law_1.2,0.03214080035686493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,power_law_1.01,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,16,8,power_law_1.2,0.03244799971580505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,16,8,power_law_1.2,0.032076799869537355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,balanced,0.25697600841522217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,16,8,power_law_1.2,0.03325439989566803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,16,8,power_law_1.2,0.032332798838615416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,16,8,power_law_1.2,0.03375999927520752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,power_law_1.01,0.1142016053199768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,16,8,power_law_1.2,0.03436160087585449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,16,8,power_law_1.2,0.04199039936065674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,balanced,0.34095998605092365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,16,8,power_law_1.2,0.03412480056285858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,16,8,power_law_1.2,0.042847999930381776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,16,8,power_law_1.2,0.03770880103111267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,16,8,power_law_1.2,0.03462400138378143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,power_law_1.01,0.1381119966506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,16,8,power_law_1.2,0.03841919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,16,8,power_law_1.2,0.03740800023078918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,16,8,power_law_1.2,0.03835520148277283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,balanced,0.41954131921132404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,16,8,power_law_1.2,0.03726719915866852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,16,8,power_law_1.2,0.04141440093517303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,power_law_1.01,0.2312704086303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,16,8,power_law_1.2,0.0492031991481781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,16,8,power_law_1.2,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,16,8,power_law_1.2,0.03864319920539856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,16,8,power_law_1.2,0.049907198548316954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,power_law_1.01,0.27429120540618895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,16,8,power_law_1.2,0.054048001766204834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,16,8,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,power_law_1.01,0.4542208194732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,16,8,power_law_1.2,0.06396160125732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,16,8,power_law_1.2,0.04306559860706329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,balanced,0.6464586655298868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,16,8,power_law_1.2,0.06888960003852844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,power_law_1.01,0.5367040157318115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,16,8,power_law_1.2,0.041280001401901245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,16,8,power_law_1.2,0.06901119947433472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,16,8,power_law_1.2,0.04343039989471435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,power_law_1.01,0.8050623893737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,16,8,power_law_1.2,0.08778240084648133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,16,8,power_law_1.2,0.04983679950237274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,16,8,power_law_1.2,0.0996288001537323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,power_law_1.01,1.0416319847106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,16,8,power_law_1.2,0.13199360370635987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,16,8,power_law_1.2,0.05565440058708191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,16,8,power_law_1.2,0.13887360095977783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,power_law_1.01,1.2882623672485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,16,8,power_law_1.2,0.06362879872322083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,16,8,power_law_1.2,0.19505280256271362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,power_law_1.01,2.055001640319824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,16,8,power_law_1.2,0.08351359963417053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,16,8,power_law_1.2,0.23256320953369142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,16,8,power_law_1.2,0.34776959419250486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,16,8,power_law_1.2,0.08650239706039428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,power_law_1.01,3.9566078186035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,balanced,1.2786026795705159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,16,8,power_law_1.2,0.38470399379730225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,16,8,power_law_1.2,0.1154047966003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,16,8,power_law_1.2,0.560268783569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,16,8,power_law_1.2,0.1246783971786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,16,8,power_law_1.2,0.7091263771057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,16,8,power_law_1.2,0.17242239713668822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,16,8,power_law_1.2,0.9141183853149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,16,8,power_law_1.2,1.6759040832519532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,16,8,power_law_1.2,0.2063999891281128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,16,8,power_law_1.2,0.2731328010559082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,16,8,power_law_1.2,2.7117952346801757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,16,8,power_law_1.2,0.025465598702430724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,16,8,power_law_1.2,0.3763904094696045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,16,8,power_law_1.2,0.02565760016441345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,16,8,power_law_1.2,0.5207808017730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,16,8,power_law_1.2,0.02545279860496521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,16,8,power_law_1.2,0.7062592029571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,balanced,0.033359999457995095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,16,8,power_law_1.2,0.02741119861602783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,16,8,power_law_1.2,0.8950207710266114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,balanced,0.029343999922275543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,16,8,power_law_1.2,0.027385601401329042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,16,8,power_law_1.2,1.4888128280639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,balanced,0.031141333281993866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,16,8,power_law_1.2,0.028646400570869444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,balanced,0.03236799935499827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,16,8,power_law_1.2,0.028799998760223388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,16,8,power_law_1.2,2.4856000900268556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,balanced,0.032773333291212715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,16,8,power_law_1.2,0.02919679880142212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,balanced,0.033520000676314034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,16,8,power_law_1.2,0.030144000053405763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,16,8,power_law_1.2,0.031692799925804135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,balanced,0.031178665657838184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,balanced,0.04035733391841253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,balanced,0.03698666642109553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,16,8,power_law_1.2,0.0359360009431839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,balanced,0.03750933210055033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,balanced,0.03806933263937632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,16,8,power_law_1.2,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,balanced,0.038736000657081604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,16,8,power_law_1.2,0.04511359930038452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,balanced,0.03856533269087473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,16,8,power_law_1.2,0.05025920271873474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,balanced,0.03886933376391729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,balanced,0.044624000787734985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,16,8,power_law_1.2,0.05319039821624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,balanced,0.04571199913819631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,16,8,power_law_1.2,0.05948160290718078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,balanced,0.04750399788220724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,16,8,power_law_1.2,0.07015680074691773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,balanced,0.062352001667022705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,balanced,0.05435733497142792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,balanced,0.07237333556016286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,16,8,power_law_1.2,0.0775168001651764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,balanced,0.06949333349863689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,16,8,power_law_1.2,0.09697920083999634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,balanced,0.09643733501434326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,balanced,0.10031466682751973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,16,8,power_law_1.2,0.1310464024543762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,balanced,0.032272001107533775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,balanced,0.1499786674976349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,balanced,0.03212266663710276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,16,8,power_law_1.2,0.14117759466171265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,balanced,0.17147199312845865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,16,8,power_law_1.2,0.21777920722961425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,balanced,0.035258665680885315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,balanced,0.26712000370025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,balanced,0.034373333056767784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,16,8,power_law_1.2,0.2912192106246948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,balanced,0.034901333351929985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,16,8,power_law_1.2,0.4396480083465576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,16,8,power_law_1.2,0.5086592197418213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,balanced,0.03554133325815201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,balanced,0.31094932556152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,balanced,0.0258240004380544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,balanced,0.035360001027584076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,16,8,power_law_1.2,0.8303423881530761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,balanced,0.025637333591779072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,16,8,power_law_1.2,1.1177151679992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,balanced,0.03628266602754593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,balanced,0.026101333399613697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,16,8,power_law_1.2,1.3851967811584474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,balanced,0.3999679883321126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,balanced,0.03696000079313914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,balanced,0.028165332973003387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,16,8,power_law_1.2,1.9570432662963868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,balanced,0.03659199923276901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,balanced,0.027786667148272198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,16,8,power_law_1.2,4.041625595092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,balanced,0.028607999285062153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,balanced,0.03743999948104223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,balanced,0.029103999336560566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,balanced,0.038245332737763725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,balanced,0.6141440073649088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,balanced,0.0284853329261144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,balanced,0.03863999992609024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,balanced,0.04359999795754751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,balanced,0.03054400036732356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,balanced,0.04340266684691111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,balanced,0.04489066700140635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,balanced,0.05113600194454193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,balanced,0.05634133517742157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,balanced,0.02938133229811986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.01,0.03341439962387085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,balanced,0.030437332888444264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,balanced,1.08787735303243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,balanced,0.07613333563009898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,balanced,0.03127466638882955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.01,0.03054719865322113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,balanced,0.08237866560618083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,balanced,0.030613332986831665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.01,0.029951998591423036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,balanced,0.11166933178901672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.01,0.03160960078239441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.01,0.03203839957714081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,balanced,0.13057600458463034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.01,0.03718400001525879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,balanced,0.18152532974878946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.01,0.046540799736976626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,balanced,0.03806400050719579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.01,0.03329919874668121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.01,0.03700479865074158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,balanced,0.03842666745185852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.01,0.03265919983386993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,balanced,0.2219466765721639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.01,0.03982079923152924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,balanced,0.039488000174363456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.01,0.03617280125617981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.01,0.03874559998512268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.01,0.03550080060958862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,power_law_1.01,0.025516799092292784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.01,0.041382399201393125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,balanced,0.32570133606592816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.01,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,balanced,0.04860800007979075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,power_law_1.01,0.025260800123214723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.01,0.035097599029541016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.01,0.04242559969425201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.01,0.036006399989128114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,power_law_1.01,0.02588160037994385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.01,0.04354560077190399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,balanced,0.05183466772238413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.01,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,balanced,0.4034080108006795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,4,power_law_1.2,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,power_law_1.01,0.02733440101146698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.01,0.03864319920539856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.01,0.05016319751739502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,power_law_1.01,0.02776319980621338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.01,0.03971840143203735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,4,power_law_1.2,0.030118399858474733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.01,0.04044159948825836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,power_law_1.01,0.028940799832344054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,4,power_law_1.2,0.0297791987657547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.01,0.04137600064277649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,balanced,0.505781332651774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,power_law_1.01,0.028838399052619933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.01,0.05920000076293945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.01,0.041875201463699344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,4,power_law_1.2,0.0321727991104126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,balanced,0.06730666756629944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.01,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,power_law_1.01,0.03136639893054962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.01,0.06643840074539184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,4,power_law_1.2,0.0322816014289856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.01,0.049267199635505673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,power_law_1.01,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.01,0.052857601642608644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.01,0.07401599884033203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,4,power_law_1.2,0.04049279987812042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,power_law_1.01,0.032518398761749265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.01,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,4,power_law_1.2,0.04392960071563721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.01,0.08951680064201355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.01,0.06996480226516724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,balanced,0.7774293422698975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,balanced,0.07834666470686595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.01,0.08268160223960877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.01,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,4,power_law_1.2,0.03808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,power_law_1.01,0.03643519878387451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.01,0.10661120414733886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,4,power_law_1.2,0.038975998759269714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.01,0.10705280303955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.01,0.11323519945144653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,power_law_1.01,0.03943040072917938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,4,power_law_1.2,0.039136001467704774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.01,0.1402943968772888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.01,0.15633920431137086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,power_law_1.01,0.04249599874019623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,balanced,0.10924266775449117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.01,0.19321600198745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.01,0.17204480171203612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,4,power_law_1.2,0.04173440039157868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.01,0.27358720302581785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,power_law_1.01,0.04806399941444397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.01,0.21111679077148438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,4,power_law_1.2,0.04311679899692535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.01,0.35751678943634035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.01,0.3260479927062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,4,power_law_1.2,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.01,0.6451903820037842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,4,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.01,0.3612735986709595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,balanced,1.5833226839701335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.01,0.6770175933837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,balanced,0.13158399860064188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,power_law_1.01,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.01,0.5991680145263671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,4,power_law_1.2,0.06113280057907104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.01,0.8849599838256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.01,1.411359977722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,balanced,0.20642666021982828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.01,0.7170048236846924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,power_law_1.01,0.05334399938583374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,4,power_law_1.2,0.06609280109405517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.01,3.0177791595458983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.01,0.8309247970581055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,4,power_law_1.2,0.07089920043945312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,balanced,0.2665226658185323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.01,1.805120086669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,4,power_law_1.2,0.09286400079727172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,4,power_law_1.2,0.09887359738349914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.01,2.348748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,power_law_1.01,0.09184640049934387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,balanced,0.3848373492558797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,4,power_law_1.2,0.14303359985351563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,4,power_law_1.2,0.12572159767150878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,power_law_1.01,0.13036799430847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,balanced,0.5008906523386637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,4,power_law_1.2,0.2135999917984009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,power_law_1.01,0.1757696032524109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,4,power_law_1.2,0.23149440288543702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,balanced,0.6232959826787313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,4,power_law_1.2,0.2790015935897827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,power_law_1.01,0.2529088020324707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,4,power_law_1.2,0.3754879951477051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,4,power_law_1.2,0.625055980682373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,power_law_1.01,0.298854398727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,4,power_law_1.2,0.7585279941558838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,power_law_1.01,0.4401343822479248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,balanced,0.975488026936849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,4,power_law_1.2,1.018892765045166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,power_law_1.01,0.535423994064331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,4,power_law_1.2,1.7759872436523438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,power_law_1.01,0.8971072196960449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,power_law_1.01,1.0563712120056152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,4,power_law_1.2,3.1677631378173827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,power_law_1.01,1.4134400367736817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,power_law_1.01,2.500230407714844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,4,power_law_1.2,0.03253760039806366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,power_law_1.01,5.679999923706054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,4,power_law_1.2,0.033580800890922545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,balanced,1.9329759279886882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,4,power_law_1.2,0.03265919983386993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,4,power_law_1.2,0.03550719916820526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,4,power_law_1.2,0.03431040048599243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,4,power_law_1.2,0.0345984011888504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,4,power_law_1.2,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,4,power_law_1.2,0.0377920001745224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,4,power_law_1.2,0.03899520039558411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,4,power_law_1.2,0.03792639970779419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,4,power_law_1.2,0.02677760124206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,4,power_law_1.2,0.03834240138530731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,4,power_law_1.2,0.04035840034484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,4,power_law_1.2,0.025945600867271424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,4,power_law_1.2,0.04058879911899567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,4,power_law_1.2,0.025721600651741026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,4,power_law_1.2,0.045900800824165346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,4,power_law_1.2,0.027603200078010558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,4,power_law_1.2,0.04911360144615173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,4,power_law_1.2,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,4,power_law_1.2,0.051660799980163576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,4,power_law_1.2,0.028889599442481994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,4,power_law_1.2,0.05674880146980286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,4,power_law_1.2,0.029395198822021483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,4,power_law_1.2,0.030137598514556885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,4,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,4,power_law_1.2,0.03265919983386993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,4,power_law_1.2,0.08030080199241638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,4,power_law_1.2,0.032793599367141726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,4,power_law_1.2,0.10933760404586793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,4,power_law_1.2,0.13392640352249147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,4,power_law_1.2,0.03475199937820435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,4,power_law_1.2,0.1813055992126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,4,power_law_1.2,0.19740159511566163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,4,power_law_1.2,0.03914879858493805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,4,power_law_1.2,0.2739135980606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,4,power_law_1.2,0.04077439904212952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,4,power_law_1.2,0.04738560020923614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,4,power_law_1.2,0.3752255916595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,4,power_law_1.2,0.6028480052947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,4,power_law_1.2,0.05888640284538269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,4,power_law_1.2,0.8518143653869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,4,power_law_1.2,0.060121601819992064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,4,power_law_1.2,1.0233728408813476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,4,power_law_1.2,0.06921600103378296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,4,power_law_1.2,1.5153535842895507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,4,power_law_1.2,0.0710207998752594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,4,power_law_1.2,3.164748764038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,4,power_law_1.2,0.08981119990348815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,balanced,0.04937066634496053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,balanced,0.04138666639725367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,balanced,0.045050665736198425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,balanced,0.04201066493988037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,balanced,0.0452106644709905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,balanced,0.04177066683769226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,4,power_law_1.2,0.1301375985145569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,balanced,0.047168001532554626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,balanced,0.043141335248947144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,balanced,0.042709335684776306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,balanced,0.04868799944718679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,balanced,0.04463466505209605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,balanced,0.048800001541773476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,4,power_law_1.2,0.1688704013824463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,balanced,0.04599999884764353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,balanced,0.048698668678601585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,balanced,0.03839466720819473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,balanced,0.048101335763931274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,4,power_law_1.2,0.26209919452667235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,balanced,0.04514666895071665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,balanced,0.049498667319615684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,balanced,0.04541333516438802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,balanced,0.04807466765244802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,4,power_law_1.2,0.3386624097824097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,balanced,0.04112533231576284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,balanced,0.04830400149027506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,balanced,0.04213866591453552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,4,power_law_1.2,0.45160961151123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,balanced,0.049973333875338234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,balanced,0.04287999868392944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,4,power_law_1.2,0.5677504062652587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,balanced,0.050053333242734276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,balanced,0.04422933359940847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,4,power_law_1.2,1.0378560066223144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,balanced,0.049829334020614624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,balanced,0.05235733091831207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,4,power_law_1.2,1.3927743911743165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,balanced,0.058373332023620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,balanced,0.05413866539796194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,4,power_law_1.2,1.410425567626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,balanced,0.05783999959627787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,balanced,0.053914666175842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,4,power_law_1.2,2.661952018737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,balanced,0.0295413335164388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,balanced,0.05877333382765452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,balanced,0.06622399886449178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,4,power_law_1.2,5.551232147216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,balanced,0.06479466458161671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,balanced,0.029482667644818623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,balanced,0.06951466699441274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,balanced,0.02945599953333537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,balanced,0.06929066777229309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,balanced,0.0865066647529602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,balanced,0.03166399896144867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,balanced,0.07804266611735027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,balanced,0.0958133339881897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,balanced,0.03139200061559677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,balanced,0.13568533460299173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,balanced,0.0817333310842514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,balanced,0.03189333279927572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,balanced,0.032560000816980995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,balanced,0.124208003282547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,balanced,0.1558613379796346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,balanced,0.03218133250872294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,balanced,0.12406933307647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,balanced,0.032816000282764435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,balanced,0.22109333674112955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,balanced,0.03398400048414866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.01,0.04100480079650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.01,0.05251200199127197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,balanced,0.18557866414388022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,balanced,0.27081600824991864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.01,0.04134399890899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.01,0.04661119878292084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,balanced,0.21734933058420816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.01,0.04156160056591034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.01,0.04609279930591583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,power_law_1.01,0.029190400242805482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,balanced,0.39422400792439777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.01,0.047276800870895384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.01,0.04261760115623474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,balanced,0.032373333970705666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,balanced,0.3115520079930623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.01,0.047628799080848695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,power_law_1.01,0.028940799832344054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.01,0.04239999949932098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,balanced,0.032773333291212715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.01,0.05850239992141724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,power_law_1.01,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.01,0.04376319944858551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,balanced,0.034143999218940735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,balanced,0.48068265120188397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.01,0.061510401964187625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,power_law_1.01,0.030822399258613586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.01,0.04394879937171936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,balanced,0.03294399877389272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,balanced,0.35528000195821124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.01,0.04848639965057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,power_law_1.01,0.031193599104881287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.01,0.043507200479507444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.01,0.0494271993637085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,power_law_1.01,0.03296639919281006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.01,0.04394879937171936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,balanced,0.6125706831614176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.01,0.05199360251426697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,power_law_1.01,0.033164799213409424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,balanced,0.47579201062520343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.01,0.044198399782180785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.01,0.053446400165557864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,power_law_1.01,0.036268800497055054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,balanced,0.04031466692686081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.01,0.04433279931545257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.01,0.06622719764709473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,power_law_1.01,0.037529599666595456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,balanced,0.04088533421357473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.01,0.04838399887084961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,balanced,0.042223999897638954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.01,0.0670527994632721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,power_law_1.01,0.03948799967765808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,balanced,0.9276373386383057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.01,0.05221760272979736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,balanced,0.6857866446177164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.01,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.01,0.06493440270423889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.01,0.07640320062637329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.01,0.07909119725227357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,power_law_1.01,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.01,0.07828480005264282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.01,0.09471359848976135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,power_law_1.01,0.047200000286102294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.01,0.07370240092277527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.01,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,balanced,0.05423999826113383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,power_law_1.01,0.05484799742698669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.01,0.09484800100326538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.01,0.12706559896469116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,balanced,0.05735999842484792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,power_law_1.01,0.06183680295944214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.01,0.10468480587005616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.01,0.11906559467315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.01,0.13861119747161865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,balanced,1.8285387357076008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.01,0.1657663941383362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,balanced,1.3136640389760335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.01,0.16395519971847533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,power_law_1.01,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.01,0.21573760509490966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.01,0.2248703956604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.01,0.30585598945617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,power_law_1.01,0.07336959838867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.01,0.28413441181182864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,balanced,0.07266133526961009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.01,0.3176703929901123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,power_law_1.01,0.09337599873542786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.01,0.37334399223327636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.01,0.48547840118408203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.01,0.5465983867645263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.01,0.5350783824920654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,balanced,0.08355200290679932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.01,0.8263168334960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,power_law_1.01,0.11294080018997192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.01,0.9400704383850098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.01,0.9364352226257324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,power_law_1.01,0.1276927947998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.01,1.1262399673461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.01,1.201356792449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.01,1.4371968269348145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,balanced,0.11133333047231038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.01,1.9492671966552735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,power_law_1.01,0.16773120164871216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.01,2.2670976638793947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.01,3.7082752227783202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,balanced,0.12863999605178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.01,4.063372802734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,power_law_1.01,0.2307391881942749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,16,8,power_law_1.2,0.05059840083122254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,power_law_1.01,0.32330880165100095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,16,8,power_law_1.2,0.044627198576927186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,power_law_1.01,0.3786623954772949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,balanced,0.1959999998410543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,16,8,power_law_1.2,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,power_law_1.01,0.6506239891052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,16,8,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,balanced,0.24873600403467813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,power_law_1.01,0.7959807872772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,16,8,power_law_1.2,0.04620800018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,balanced,0.36797865231831867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,power_law_1.01,1.135200023651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,16,8,power_law_1.2,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,power_law_1.01,1.577337646484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,16,8,power_law_1.2,0.061452800035476686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,balanced,0.4769226710001628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,power_law_1.01,1.8776639938354491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,16,8,power_law_1.2,0.047635200619697574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,power_law_1.01,2.964454460144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,16,8,power_law_1.2,0.04902400076389313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,balanced,0.5903306802113851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,power_law_1.01,5.603699111938477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,16,8,power_law_1.2,0.04999040067195892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,16,8,power_law_1.2,0.052876800298690796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,16,8,power_law_1.2,0.05997440218925476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,16,8,power_law_1.2,0.06502400040626526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,16,8,power_law_1.2,0.07060480117797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,16,8,power_law_1.2,0.04084480106830597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,balanced,0.9333919684092203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,16,8,power_law_1.2,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,16,8,power_law_1.2,0.041152000427246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,16,8,power_law_1.2,0.09548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,16,8,power_law_1.2,0.0412416011095047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,16,8,power_law_1.2,0.09869440197944641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,16,8,power_law_1.2,0.04338560104370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,16,8,power_law_1.2,0.12434560060501099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,16,8,power_law_1.2,0.04229120016098022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,16,8,power_law_1.2,0.12956160306930542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,16,8,power_law_1.2,0.0440064013004303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,16,8,power_law_1.2,0.18028160333633422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,16,8,power_law_1.2,0.0453247994184494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,balanced,1.842890739440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,16,8,power_law_1.2,0.21697280406951905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,16,8,power_law_1.2,0.042931199073791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,16,8,power_law_1.2,0.30977280139923097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,16,8,power_law_1.2,0.04420480132102966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,16,8,power_law_1.2,0.33983359336853025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,16,8,power_law_1.2,0.045484799146652224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,16,8,power_law_1.2,0.505459213256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,16,8,power_law_1.2,0.04630399942398071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,16,8,power_law_1.2,0.627884817123413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,16,8,power_law_1.2,0.04831359982490539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,16,8,power_law_1.2,0.9371135711669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,16,8,power_law_1.2,0.051948797702789304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,16,8,power_law_1.2,1.1610943794250488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,16,8,power_law_1.2,0.06394240260124207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,16,8,power_law_1.2,1.4001983642578124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,16,8,power_law_1.2,0.07986559867858886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,16,8,power_law_1.2,2.229523277282715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,16,8,power_law_1.2,0.08057600259780884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,16,8,power_law_1.2,0.07438079714775085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,16,8,power_law_1.2,4.192300796508789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,16,8,power_law_1.2,0.09281280040740966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,16,8,power_law_1.2,0.10696959495544434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,16,8,power_law_1.2,0.1401087999343872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,16,8,power_law_1.2,0.16298880577087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,16,8,power_law_1.2,0.246995210647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,16,8,power_law_1.2,0.28089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,16,8,power_law_1.2,0.3945280075073242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,16,8,power_law_1.2,0.5228288173675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,16,8,power_law_1.2,0.84967041015625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,16,8,power_law_1.2,1.0283455848693848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,balanced,0.039781334499518074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,16,8,power_law_1.2,1.283993625640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,16,8,power_law_1.2,1.9808832168579102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,balanced,0.03944533318281174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,balanced,0.04353066782156626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,16,8,power_law_1.2,3.752249526977539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,16,8,power_law_1.2,0.029158401489257812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,balanced,0.04622933268547058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,16,8,power_law_1.2,0.029049599170684816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,balanced,0.047824000318845115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,16,8,power_law_1.2,0.029395198822021483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,balanced,0.0499893327554067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,16,8,power_law_1.2,0.030988800525665283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,balanced,0.04910400013128916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,16,8,power_law_1.2,0.031251201033592226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,balanced,0.04986133178075155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,16,8,power_law_1.2,0.03247359991073608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,balanced,0.04984533290068308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,16,8,power_law_1.2,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,balanced,0.04906133313973745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,16,8,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,balanced,0.04922133187452952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,16,8,power_law_1.2,0.037747201323509214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,balanced,0.05067733426888784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,16,8,power_law_1.2,0.03902080059051514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,balanced,0.035717333356539406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,balanced,0.05050133168697357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,balanced,0.03585600107908249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,balanced,0.04320000112056732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,balanced,0.05188799897829691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,16,8,power_law_1.2,0.043033599853515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,balanced,0.04507199923197428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,balanced,0.062362665931383766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,balanced,0.04475200176239014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,16,8,power_law_1.2,0.05431680083274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,balanced,0.03862933317820231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,balanced,0.06144533554712931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,16,8,power_law_1.2,0.05633919835090637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,balanced,0.0396373321612676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,balanced,0.06193066636721293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,balanced,0.039642666776975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,16,8,power_law_1.2,0.06810879707336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,balanced,0.03955200066169103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,balanced,0.0703893353541692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.01,0.045561599731445315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,balanced,0.04083200047413508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,balanced,0.07165866593519847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.01,0.0474047988653183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,balanced,0.04844800134499868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,16,8,power_law_1.2,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,balanced,0.028837333122889202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,balanced,0.09218133489290874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.01,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,balanced,0.048725331823031105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,16,8,power_law_1.2,0.07440639734268188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,balanced,0.09948266545931499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,balanced,0.04854399959246317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,balanced,0.02842666705449422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.01,0.04982399940490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,16,8,power_law_1.2,0.09168639779090881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,balanced,0.04428266485532125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.01,0.05006719827651977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,balanced,0.029487999776999157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,balanced,0.12377599875132243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,balanced,0.04955733319123586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.01,0.06004480123519897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,balanced,0.031290667752424874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,balanced,0.05129600067933401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,balanced,0.16391467054684958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.01,0.06408960223197938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,balanced,0.031045332551002502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,16,8,power_law_1.2,0.10698879957199096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.01,0.05615360140800476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,balanced,0.0681279997030894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,16,8,power_law_1.2,0.14024319648742675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,balanced,0.23717333873112997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,balanced,0.031727999448776245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.01,0.05511040091514587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.01,0.05297920107841492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,balanced,0.07461866736412048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,balanced,0.03285333265860876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.01,0.05249279737472534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,balanced,0.23938133319218954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,balanced,0.09347732861836751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,balanced,0.0325546662012736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.01,0.05380480289459229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,16,8,power_law_1.2,0.19445120096206664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.01,0.05594879984855652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,balanced,0.110042671362559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.01,0.07584000229835511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,balanced,0.367850661277771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,balanced,0.14231466253598532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,16,8,power_law_1.2,0.19598720073699952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.01,0.08387200236320495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,balanced,0.033173332611719765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.01,0.0946943998336792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,balanced,0.17864533265431723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,balanced,0.034058667719364166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.01,0.0883072018623352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,16,8,power_law_1.2,0.3093696117401123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,balanced,0.4417813221613566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.01,0.11667840480804444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,balanced,0.25482134024302167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,16,8,power_law_1.2,0.3871295928955078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.01,0.11537280082702636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.01,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.01,0.14730240106582643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.01,0.037894400954246524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,balanced,0.3030933340390523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.01,0.14962559938430786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,16,8,power_law_1.2,0.6225279808044434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,balanced,0.5688373247782389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.01,0.04099839925765991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.01,0.22344319820404052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,balanced,0.0335413341720899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,16,8,power_law_1.2,0.8096192359924317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.01,0.044377601146698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.01,0.31249279975891114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,balanced,0.4407573143641154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.01,0.4887296199798584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,balanced,0.03429333368937174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.01,0.04377599954605103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,16,8,power_law_1.2,1.1988096237182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.01,0.44077439308166505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.01,0.039443200826644896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,balanced,0.03589333345492681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,16,8,power_law_1.2,1.6018047332763672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.01,0.673689603805542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,balanced,0.035631999373435974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,balanced,0.5587146679560343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.01,0.04046080112457275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,balanced,0.8605759938557943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.01,0.957158374786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,16,8,power_law_1.2,1.909209632873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.01,1.3046015739440917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.01,0.040275201201438904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,16,8,power_law_1.2,3.15295352935791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.01,2.3299455642700195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.01,0.043647998571395875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.01,3.5502784729003904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,balanced,0.703711986541748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.01,0.04191359877586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,16,8,power_law_1.2,6.084921646118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,balanced,0.045168002446492515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.01,0.046751999855041505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.01,0.05002880096435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,balanced,0.045381332437197365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.01,0.049472001194953916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,balanced,0.049253334601720176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.01,0.05740799903869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,balanced,1.084661324818929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,balanced,1.6418399810791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.01,0.06514559984207154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,balanced,0.06283199787139893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.01,0.0720255970954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,balanced,0.06906666855017345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.01,0.07164160013198853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.01,0.09057919979095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,power_law_1.01,0.02858879864215851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.01,0.09470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,balanced,0.08905599514643352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,power_law_1.01,0.028288000822067262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.01,0.12258559465408325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,balanced,2.245349407196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,power_law_1.01,0.029849600791931153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.01,0.16227200031280517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,power_law_1.01,0.031091201305389404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.01,0.2099071979522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,power_law_1.01,0.03132160007953644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,balanced,0.10727999607721965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.01,0.29358720779418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.01,0.4200767993927002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,power_law_1.01,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.01,0.5510079860687256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.01,0.7195519924163818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.01,0.9852160453796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,power_law_1.01,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,balanced,0.1486133337020874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.01,1.1083328247070312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,power_law_1.01,0.038335999846458434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,4,power_law_1.2,0.046112000942230225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.01,1.9953279495239258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,balanced,0.19788267215092978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,4,power_law_1.2,0.04481280148029328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.01,4.687263870239258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,balanced,0.2980159918467204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,power_law_1.01,0.04500479996204376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,4,power_law_1.2,0.046393600106239316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,power_law_1.01,0.05306239724159241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,4,power_law_1.2,0.04999679923057556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,balanced,0.3773386478424072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,power_law_1.01,0.04906879961490631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,4,power_law_1.2,0.050425601005554196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,power_law_1.01,0.05788800120353699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,4,power_law_1.2,0.06039680242538452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,balanced,0.5507626533508301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,4,power_law_1.2,0.06409599781036376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,4,power_law_1.2,0.0531328022480011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,power_law_1.01,0.06833279728889466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,balanced,0.7211466630299886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,4,power_law_1.2,0.05548160076141358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,power_law_1.01,0.07104640007019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,power_law_1.01,0.08895999789237977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,4,power_law_1.2,0.05437440276145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,4,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,balanced,0.8960959911346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,power_law_1.01,0.10648959875106812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,4,power_law_1.2,0.053260797262191774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,power_law_1.01,0.1369472026824951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,4,power_law_1.2,0.06310399770736694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,4,power_law_1.2,0.07196159958839417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,4,power_law_1.2,0.08627200126647949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,power_law_1.01,0.19561599493026732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,balanced,1.4167680740356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,4,power_law_1.2,0.08730239868164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,power_law_1.01,0.2462847948074341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,4,power_law_1.2,0.09512320160865784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,4,power_law_1.2,0.1164736032485962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,4,power_law_1.2,0.12190719842910766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,power_law_1.01,0.30174078941345217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,4,power_law_1.2,0.1526080012321472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,power_law_1.01,0.42215681076049805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,4,power_law_1.2,0.19027199745178222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,power_law_1.01,0.6567808151245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,4,power_law_1.2,0.20702719688415527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,4,power_law_1.2,0.3723200082778931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,power_law_1.01,0.8887040138244628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,balanced,2.809962590535482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,4,power_law_1.2,0.6554111957550048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,power_law_1.01,1.410201644897461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,4,power_law_1.2,0.5688960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,power_law_1.01,2.050067138671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,4,power_law_1.2,0.961843204498291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,power_law_1.01,2.3467967987060545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,4,power_law_1.2,1.0608448028564452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,power_law_1.01,4.0389057159423825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,4,power_law_1.2,1.1836031913757323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,power_law_1.01,8.599129486083985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,4,power_law_1.2,2.365260887145996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,4,power_law_1.2,4.744927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,4,power_law_1.2,0.03683840036392212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,4,power_law_1.2,0.03749760091304779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,4,power_law_1.2,0.04103679955005646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,4,power_law_1.2,0.04431360065937042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,4,power_law_1.2,0.028479999303817748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,4,power_law_1.2,0.043961599469184875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,4,power_law_1.2,0.02863360047340393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,4,power_law_1.2,0.03916159868240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,4,power_law_1.2,0.029465600848197937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,4,power_law_1.2,0.040300801396369934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,4,power_law_1.2,0.030675199627876282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,4,power_law_1.2,0.040268799662590025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,4,power_law_1.2,0.03107840120792389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,4,power_law_1.2,0.04332799911499023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,4,power_law_1.2,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,4,power_law_1.2,0.0434112012386322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,4,power_law_1.2,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,4,power_law_1.2,0.035872000455856326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,4,power_law_1.2,0.04859519898891449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,4,power_law_1.2,0.04986880123615265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,4,power_law_1.2,0.03829120099544525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,4,power_law_1.2,0.04924159944057464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,4,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,4,power_law_1.2,0.05856639742851257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,4,power_law_1.2,0.06926720142364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,4,power_law_1.2,0.06401280164718628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,4,power_law_1.2,0.07461760044097901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,4,power_law_1.2,0.04520959854125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,4,power_law_1.2,0.09210240244865417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,4,power_law_1.2,0.04981119930744171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,4,power_law_1.2,0.11004159450531006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,4,power_law_1.2,0.048403200507164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,4,power_law_1.2,0.12772480249404908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,4,power_law_1.2,0.06474239826202392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,4,power_law_1.2,0.16376320123672486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,4,power_law_1.2,0.21413760185241698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,4,power_law_1.2,0.31778559684753416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,4,power_law_1.2,0.07560319900512695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,4,power_law_1.2,0.44625282287597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,4,power_law_1.2,0.06930559873580933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,4,power_law_1.2,0.5716991901397706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,4,power_law_1.2,0.09815040230751038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,4,power_law_1.2,0.829094409942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,4,power_law_1.2,1.073408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,4,power_law_1.2,0.09800959825515747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,4,power_law_1.2,1.3629631996154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,4,power_law_1.2,0.13509759902954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,4,power_law_1.2,2.3443456649780274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,4,power_law_1.2,0.1789247989654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,4,power_law_1.2,4.157625579833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,balanced,0.11809600392977397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,balanced,0.1901599963506063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,4,power_law_1.2,0.2377023935317993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,balanced,0.1141973336537679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,balanced,0.18979199727376303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,balanced,0.119077334801356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,balanced,0.19088532527287802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,balanced,0.1222773293654124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,4,power_law_1.2,0.3876352071762085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,balanced,0.19987734158833823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,4,power_law_1.2,0.5164671897888183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,balanced,0.12289599577585857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,balanced,0.1984000007311503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,4,power_law_1.2,0.5864768028259277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,balanced,0.20129066705703735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,balanced,0.34493335088094074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,4,power_law_1.2,0.7567872047424317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,balanced,0.20320000251134238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,balanced,0.3652106523513794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,4,power_law_1.2,1.4435392379760743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,balanced,0.19880000750223795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,balanced,0.35944533348083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,4,power_law_1.2,2.070047950744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,balanced,0.34177064895629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,balanced,0.20359466473261514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,4,power_law_1.2,2.879743957519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,balanced,0.3498826821645101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,balanced,0.2068586746851603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,balanced,0.35948801040649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,4,power_law_1.2,4.285433578491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,balanced,0.21151467164357504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,balanced,0.3432106574376424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,4,power_law_1.2,7.414771270751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,balanced,0.21077867348988852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,balanced,0.34770135084788006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,balanced,0.21248000860214233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,balanced,0.3378346761067708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,balanced,0.3559733231862386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,balanced,0.21287999550501505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,balanced,0.3643626769383748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,balanced,0.21567465861638388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,balanced,0.36760000387827557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,balanced,0.2143626610438029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,balanced,0.33769067128499347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,balanced,0.2175146738688151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,balanced,0.05634133517742157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,balanced,0.3386666774749756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,balanced,0.2262293299039205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,balanced,0.05362666646639506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,balanced,0.33269866307576496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,balanced,0.2360960046450297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,balanced,0.05685866872469584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,balanced,0.058229332168896995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,balanced,0.33275200923283893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,balanced,0.24194665749867758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,balanced,0.06192533175150553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,balanced,0.07314133147398631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,balanced,0.2595573266347249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,balanced,0.3193173408508301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,balanced,0.07454933226108551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,balanced,0.07525333265463512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,balanced,0.07523199915885925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,balanced,0.2629706660906474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,balanced,0.26311467091242474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,balanced,0.0761653333902359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,balanced,0.07707733412583669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,balanced,0.07712533573309581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,balanced,0.07890133559703827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,balanced,0.08002666632334392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,balanced,0.5766400098800659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,balanced,0.45837334791819256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,balanced,0.08659199873606364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,balanced,0.08611200253168742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,balanced,0.08965866764386494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.33832321166992185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,balanced,0.4841333230336507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,balanced,0.4660746653874715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.33977599143981935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.3122560024261475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,balanced,0.09773332873980205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.2756864070892334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.3514303922653198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.3526400089263916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.2025984048843384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.3567296028137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,balanced,0.6701280275980631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,balanced,0.7256906827290853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.19048320055007933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.3490560054779053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.20062720775604248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.37016959190368653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,balanced,0.10637866457303365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,power_law_1.01,0.06681600213050842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.19651199579238893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.34408318996429443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,balanced,0.12075199683507283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.202239990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.3293247938156128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.2001471996307373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.3344448089599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,power_law_1.01,0.06356480121612548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,balanced,0.131632000207901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.19866880178451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.3267263889312744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,power_law_1.01,0.07118719816207886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.2026815891265869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,power_law_1.01,0.07200639843940734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.32140800952911375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,balanced,0.9480906327565511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,balanced,0.8706506888071696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.20714240074157714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,power_law_1.01,0.07342720031738281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.31407999992370605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,power_law_1.01,0.07376639842987061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.19392000436782836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.2992511987686157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.19100159406661987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,power_law_1.01,0.07475839853286743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.2790015935897827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.19095679521560668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,power_law_1.01,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.38862080574035646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,balanced,0.15982932845751444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,power_law_1.01,0.07622399926185608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.1968127965927124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.4253824234008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,power_law_1.01,0.07854719758033753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.19241600036621093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.5140223979949952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,power_law_1.01,0.08042880296707153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,balanced,0.18314667542775473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.18918399810791015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.5403840065002441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,power_law_1.01,0.08160640001296997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.18122880458831786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.01,0.8870079994201661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,balanced,1.1607946554819744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,balanced,1.07424529393514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,power_law_1.01,0.09633280038833618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.1793984055519104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.01,1.1834815979003905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,power_law_1.01,0.1044543981552124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,balanced,0.23778132597605386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.2252863883972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.01,1.702796745300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,power_law_1.01,0.11308799982070923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.2488192081451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.3160896062850952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,power_law_1.01,0.1244928002357483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.01,2.124985694885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.3602688074111938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.01,3.304492950439453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,balanced,0.28756266832351685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,power_law_1.01,0.15123200416564941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.550438404083252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.01,4.587116622924805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.609881591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,1.0231488227844239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.01,0.142739200592041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.01,5.194854354858398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,1.3490495681762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.01,0.1892416000366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,1.9311616897583008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.01,10.253388977050781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.01,0.2386240005493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,2.957881546020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.33549439907073975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.01,0.2860095977783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.01,3.3364734649658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,balanced,1.8989760080973308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,balanced,0.40580801169077557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,balanced,1.7036959330240886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.01,24.978060913085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.01,0.4204991817474365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.33863680362701415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.01,5.320940780639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.3104576110839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.01,0.5574272155761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.3412224054336548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.01,0.6491583824157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.33943679332733157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.01,11.897913360595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.34760959148406984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.35072638988494875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.01,1.081503963470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.3492863893508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.01,1.2628352165222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.3412735939025879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,balanced,0.5197813510894775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.34926719665527345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.33320319652557373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.32884480953216555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.3227839946746826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,power_law_1.01,1.9687744140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.31499519348144533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.2965440034866333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.01,2.8911615371704102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.28280959129333494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.3023103952407837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,128,power_law_1.2,0.20427520275115968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.01,5.6564289093017575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.3846271991729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,128,power_law_1.2,0.19151999950408935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.5537024021148682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,128,power_law_1.2,0.1675647974014282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.7284480094909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,balanced,0.6490346590677897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,128,power_law_1.2,0.19591679573059081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.8844672203063965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,128,power_law_1.2,0.19937920570373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,128,power_law_1.2,1.1104512214660645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,128,power_law_1.2,0.19530240297317505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,128,power_law_1.2,1.4982399940490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,128,power_law_1.2,0.2005376100540161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,128,power_law_1.2,2.361075210571289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,128,power_law_1.2,0.20574719905853273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,128,power_law_1.2,3.4702335357666017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,128,power_law_1.2,0.1891711950302124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,128,power_law_1.2,0.19449599981307983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,128,power_law_1.2,6.735897827148437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,128,power_law_1.2,0.19575040340423583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,128,power_law_1.2,9.566802978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,128,power_law_1.2,0.19294079542160034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,balanced,3.9066718419392905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,balanced,3.474485397338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,128,power_law_1.2,0.1923583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,128,power_law_1.2,12.047142028808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,128,power_law_1.2,0.18789119720458985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,128,power_law_1.2,0.1778880000114441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,128,power_law_1.2,0.18769919872283936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,128,power_law_1.2,18.10401306152344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,128,power_law_1.2,0.2109055995941162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,balanced,1.0125439961751301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,128,power_law_1.2,0.2609472036361694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,128,power_law_1.2,0.29038081169128416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,128,power_law_1.2,0.3846271991729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,128,power_law_1.2,44.645068359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,128,power_law_1.2,0.516761589050293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,128,power_law_1.2,0.6016448020935059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,128,power_law_1.2,0.9063872337341309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,128,power_law_1.2,1.6576448440551759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,128,power_law_1.2,2.0181503295898438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,128,power_law_1.2,3.2636032104492188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,128,power_law_1.2,4.578694534301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,128,power_law_1.2,5.5425151824951175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,128,power_law_1.2,10.501753234863282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,128,power_law_1.2,24.506790161132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,balanced,2.041696071624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,128,power_law_1.2,0.06718720197677612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,128,power_law_1.2,0.06615679860115051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,128,power_law_1.2,0.055955201387405396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,balanced,0.1204159955183665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,128,power_law_1.2,0.0716159999370575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,128,power_law_1.2,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,balanced,0.11500799655914307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,128,power_law_1.2,0.07363200187683105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,128,power_law_1.2,0.07359359860420227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,balanced,0.12005333105723064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,128,power_law_1.2,0.07541120052337646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,balanced,0.12194133798281352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,128,power_law_1.2,0.07553279995918274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,balanced,0.2010879913965861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,balanced,0.3715733289718628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,128,power_law_1.2,0.07691519856452941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,balanced,0.07729599873224895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,balanced,0.3700480063756307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,128,power_law_1.2,0.08024960160255432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,balanced,0.08030400176843007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,balanced,0.37382400035858154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,128,power_law_1.2,0.08246399760246277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,balanced,0.07861333092053731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,balanced,0.3628693421681722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,128,power_law_1.2,0.0898751974105835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,balanced,0.07915199796358745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,balanced,0.36429866154988605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,128,power_law_1.2,0.09584640264511109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,balanced,0.12967466314633688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,balanced,0.3527359962463379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,128,power_law_1.2,0.1041152000427246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,balanced,0.21693867444992065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,balanced,0.3686399857203166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,128,power_law_1.2,0.12267520427703857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,balanced,0.2118133306503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,balanced,0.35786668459574383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,balanced,0.21532267332077026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,128,power_law_1.2,0.13634560108184815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,balanced,0.35790932178497314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,balanced,0.21566933393478394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,balanced,0.36267733573913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,128,power_law_1.2,0.18099839687347413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,balanced,0.22143999735514322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,balanced,0.3552639881769816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,balanced,0.22028799851735434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,balanced,0.37037865320841473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,balanced,0.223855992158254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,balanced,0.3598879973093669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.2,0.1743232011795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,balanced,0.21859200795491537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,balanced,0.20490666230519614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.2,0.2371903896331787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,balanced,0.3428853352864583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,balanced,0.2190986673037211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.2,0.28142080307006834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,balanced,0.3487093448638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,balanced,0.21094399690628052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,balanced,0.21306133270263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,balanced,0.33791999022165936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,balanced,0.23278933763504028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.2,0.4308608055114746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.01,0.3503232002258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,balanced,0.2237386703491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.2,0.5119679927825928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,balanced,0.3163680036862691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.01,0.3686784029006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.2,0.7528319835662842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,balanced,0.24086399873097739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.01,0.3268160104751587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.2,0.9869183540344239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,balanced,0.2814133365948995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,balanced,0.2485226591428121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.01,0.21374719142913817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.01,0.2184704065322876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.2,1.5878080368041991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.01,0.20549120903015136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.01,0.2632512092590332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,balanced,0.27331199248631793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.01,0.16839679479598998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.2,1.9033472061157226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,balanced,0.5747306744257609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.01,0.13585920333862306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,balanced,0.044938668608665466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.01,0.31630079746246337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.01,0.16243200302124022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,balanced,0.2768373290697734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,balanced,0.04560533165931702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.01,0.19482239484786987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,128,power_law_1.2,2.8206655502319338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.01,0.290720009803772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.01,0.20421760082244872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,balanced,0.04593066871166229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.01,0.3388351917266846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.01,0.20071680545806886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,balanced,0.04762133459250132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.2,4.429478454589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,balanced,0.5035786628723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,balanced,0.061754668752352394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.01,0.20787839889526366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.01,0.3120255947113037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,balanced,0.4706186850865682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,balanced,0.07452799876530965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.01,0.20112640857696534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.01,0.3379199981689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,balanced,0.0751146674156189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.01,0.21151359081268312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.2,13.363072204589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,balanced,0.07617599765459697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.01,0.20373759269714356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.01,0.34955520629882814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,balanced,0.07618133227030437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.01,0.18995200395584105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.01,0.33791360855102537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,balanced,0.07674666742483775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.01,0.19534080028533934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,balanced,0.48336533705393475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,balanced,0.07761066655317943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.01,0.19080959558486937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.01,0.3380160093307495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,balanced,0.7180266380310059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.01,0.19765119552612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,balanced,0.07855466504891713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.01,0.34371199607849123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.01,0.1973312020301819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,balanced,0.0803413341442744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.01,0.20300159454345704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.01,0.3217087984085083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,balanced,0.08172266681989034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.01,0.2611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.01,0.33260159492492675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,balanced,0.08741866548856099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.01,0.31658880710601806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.01,0.3197824001312256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.01,0.3685760021209717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,balanced,0.6954452991485596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,balanced,0.08753599723180135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.01,0.5221695899963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.01,0.4038400173187256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,power_law_1.01,0.0741823971271515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,balanced,0.09179733196894328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.01,0.5906688213348389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,balanced,0.9398773511250814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.01,0.39064960479736327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,power_law_1.01,0.06805760264396668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.01,0.815833568572998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,64,power_law_1.2,0.3577280044555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,power_law_1.01,0.058719998598098753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.01,0.4630720138549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.01,1.054924774169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,power_law_1.01,0.05911039710044861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,64,power_law_1.2,0.36550400257110593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,balanced,0.10042132933934529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,power_law_1.01,0.06895999908447266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,64,power_law_1.2,0.1602687954902649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.01,1.457759952545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.01,0.5440256118774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,power_law_1.01,0.06863999962806702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,64,power_law_1.2,0.21000959873199462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,balanced,0.9073920249938965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.01,0.7321856021881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.01,1.912883186340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,power_law_1.01,0.07212799787521362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,64,power_law_1.2,0.22577919960021972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,64,power_law_1.2,0.24936320781707763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.01,0.904428768157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,power_law_1.01,0.07455360293388366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.01,2.4198335647583007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,64,power_law_1.2,0.3001535892486572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,power_law_1.01,0.07402240037918091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.01,1.1975808143615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,64,power_law_1.2,0.3362175941467285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,balanced,0.10891733566919963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,power_law_1.01,0.07634559869766236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.01,4.322092819213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,balanced,1.1812907059987385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.01,1.5159232139587402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,64,power_law_1.2,0.3249408006668091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,power_law_1.01,0.07428479790687562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,64,power_law_1.2,0.3283071994781494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,balanced,0.12450133760770161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.01,2.687539291381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,power_law_1.01,0.08104959726333619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.01,9.13486099243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,64,power_law_1.2,0.34793601036071775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,64,power_law_1.2,0.3136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,power_law_1.01,0.07939199805259704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,balanced,0.13773866494496664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.01,3.175129508972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,64,power_law_1.2,0.32683520317077636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,power_law_1.01,0.08731520175933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,balanced,1.1212053298950195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.01,3.8888320922851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,64,power_law_1.2,0.313369607925415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,power_law_1.01,0.09855999946594238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,64,power_law_1.2,0.34228479862213135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,power_law_1.01,0.1059391975402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.01,6.620851135253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,64,power_law_1.2,0.33018879890441893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,power_law_1.01,0.1121216058731079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,64,power_law_1.2,0.3971519947052002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,64,power_law_1.2,0.406982421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.01,13.8051513671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,power_law_1.01,0.1379263997077942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,64,power_law_1.2,0.4028736114501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,balanced,0.16791999340057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,64,power_law_1.2,0.5815872192382813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,power_law_1.01,0.1410431981086731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,64,power_law_1.2,0.6398143768310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,balanced,0.19545066356658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,balanced,1.914357344309489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,power_law_1.01,0.17299840450286866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,64,power_law_1.2,1.0366911888122559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,power_law_1.01,0.21756160259246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,64,power_law_1.2,1.1179776191711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,64,power_law_1.2,1.6924415588378907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,balanced,0.2602399984995524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,64,power_law_1.2,2.6433855056762696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,balanced,1.7762719790140789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,64,power_law_1.2,3.713753509521484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,power_law_1.01,0.26362879276275636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,64,power_law_1.2,4.772102355957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,power_law_1.01,0.36602880954742434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,balanced,0.31612799564997357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,power_law_1.01,0.5490176200866699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,64,power_law_1.2,7.731295776367188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,power_law_1.01,0.6508992195129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,64,power_law_1.2,10.321363067626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,power_law_1.2,24.714373779296874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,power_law_1.01,0.9709312438964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,balanced,0.4618613322575887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,power_law_1.01,1.4116415977478027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,power_law_1.01,1.6870527267456055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,power_law_1.01,2.744691276550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,balanced,0.5985600153605143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,power_law_1.01,5.202406311035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,64,balanced,3.936730702718099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,balanced,3.6447200775146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,balanced,0.7508587042490641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,balanced,1.1495893001556396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,64,power_law_1.2,0.2182528018951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,64,power_law_1.2,0.20470399856567384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,64,power_law_1.2,0.11622400283813476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,64,power_law_1.2,0.13408639430999755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,64,power_law_1.2,0.1526528000831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,64,power_law_1.2,0.16186239719390869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,64,power_law_1.2,0.2081216096878052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,64,power_law_1.2,0.2060352087020874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,64,power_law_1.2,0.17366399765014648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,64,power_law_1.2,0.19985920190811157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,64,power_law_1.2,0.17592959403991698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,64,power_law_1.2,0.20432000160217284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,64,power_law_1.2,0.2102207899093628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,64,power_law_1.2,0.20151679515838622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,64,power_law_1.2,0.18736640214920045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,64,power_law_1.2,0.19737600088119506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,64,power_law_1.2,0.21101438999176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,64,power_law_1.2,0.2501120090484619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,64,power_law_1.2,0.2791167974472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,64,power_law_1.2,0.3677567958831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,64,power_law_1.2,0.42892160415649416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,64,power_law_1.2,0.07512959837913513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,64,power_law_1.2,0.5875520229339599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,64,power_law_1.2,0.7183040142059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,64,power_law_1.2,0.06815360188484192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,64,power_law_1.2,0.9696831703186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,64,power_law_1.2,0.054688000679016115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,balanced,0.0577706644932429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,64,power_law_1.2,1.3921792030334472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,64,power_law_1.2,0.05811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,balanced,0.056554665168126426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,balanced,2.3003199895222983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,64,power_law_1.2,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,balanced,0.05596266686916351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,64,power_law_1.2,2.0900415420532226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,64,power_law_1.2,0.06921600103378296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,balanced,0.06381866832574208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,64,power_law_1.2,3.1374847412109377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,64,power_law_1.2,0.07272319793701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,balanced,0.07669333120187123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,64,power_law_1.2,0.07097600102424621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,balanced,0.10644267002741496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,64,power_law_1.2,3.3131454467773436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,64,power_law_1.2,0.07685120105743408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,balanced,0.10686399539311726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,64,power_law_1.2,0.07490559816360473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,balanced,0.10711466272672017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,64,power_law_1.2,7.437229156494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,64,power_law_1.2,0.08085119724273682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,balanced,0.10706667105356853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,64,power_law_1.2,0.0784704029560089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,balanced,0.10769066214561462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,64,power_law_1.2,0.08111360073089599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,64,power_law_1.2,14.3240966796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,balanced,0.1090880036354065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,64,power_law_1.2,0.0908735990524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,balanced,0.10944533348083496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,64,power_law_1.2,0.10368640422821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,balanced,0.11059199770291646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,balanced,0.049285332361857094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,balanced,0.11473066608111064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,64,power_law_1.2,0.10611840486526489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,balanced,0.0487306664387385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,balanced,0.12123200297355652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,64,power_law_1.2,0.12709759473800658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,balanced,0.048672000567118325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,balanced,0.12185600399971008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,balanced,0.05203733344872793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,balanced,0.12109866738319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,64,power_law_1.2,0.17274880409240723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,balanced,0.05877333382765452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,balanced,0.07817066709200542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,balanced,0.13148799538612366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,balanced,0.0802400012811025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,balanced,0.1350933313369751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,balanced,0.08107733229796092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,64,power_law_1.2,0.1662783980369568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,balanced,0.08238400022188823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,balanced,0.14979199568430582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,balanced,0.08269333342711131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,64,power_law_1.2,0.19815679788589477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,balanced,0.08453333377838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,64,power_law_1.2,0.26362879276275636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,balanced,0.1662879983584086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,balanced,0.084906667470932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,balanced,0.08667733271916707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,64,power_law_1.2,0.37772159576416015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,balanced,0.1891253391901652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,balanced,0.08815466364224751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,64,power_law_1.2,0.49555201530456544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,64,power_law_1.2,0.7074111938476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,balanced,0.09473066528638203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,balanced,0.2164799968401591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,balanced,0.09544000029563904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,64,power_law_1.2,0.9238143920898437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,balanced,0.1011840005715688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,64,power_law_1.2,1.6229440689086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.01,0.12332160472869873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,balanced,0.1123253305753072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,balanced,0.28310932715733844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,64,power_law_1.2,1.7921855926513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.01,0.10819200277328492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,balanced,0.12367467085520427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.01,0.0884607970714569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,64,power_law_1.2,2.2086015701293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,balanced,0.1450399955113729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.01,0.07276800274848938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,64,power_law_1.2,3.885676956176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.01,0.07928320169448852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,balanced,0.33712534109751385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,balanced,0.1633333365122477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,balanced,0.04500266909599304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.01,0.08744320273399353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.01,0.07883520126342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,balanced,0.045610666275024414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,64,power_law_1.2,8.816409301757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,balanced,0.2037866711616516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.01,0.09689599871635438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.01,0.07054719924926758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,balanced,0.04565866788228353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.01,0.09756799936294555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.01,0.06101120114326477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,balanced,0.04819199939568838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.01,0.09671040177345276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,balanced,0.24234666426976523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,balanced,0.059952000776926674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.01,0.060070401430130003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.01,0.10612479448318482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,balanced,0.44415998458862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,balanced,0.07564266522725423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.01,0.062015998363494876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.01,0.09756799936294555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,balanced,0.07685866455237071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.01,0.06632320284843445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,balanced,0.0772159993648529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.01,0.10644479990005493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,balanced,0.32438933849334717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.01,0.07512320280075073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,balanced,0.0783679982026418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.01,0.10625920295715333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.01,0.07576320171356202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,balanced,0.07865599791208903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.01,0.11367039680480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,balanced,0.0802293320496877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.01,0.07534719705581665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.01,0.126528000831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,balanced,0.08107733229796092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.01,0.07807999849319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,balanced,0.4096693197886149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.01,0.12340480089187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,balanced,0.08250666658083598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.01,0.07768319845199585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,balanced,0.5841493209203085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.01,0.12407679557800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,balanced,0.08408000071843465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.01,0.08273919820785522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,balanced,0.09082667032877605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.01,0.1450495958328247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.01,0.08331519961357117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,balanced,0.09092266360918681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.01,0.15576959848403932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.01,0.1901695966720581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.01,0.09522560238838196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,balanced,0.09505599737167358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,balanced,0.5704426765441895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.01,0.09639679789543151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.01,0.2065279960632324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.01,0.10713599920272827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.01,0.2900160074234009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.01,0.11950080394744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.01,0.30820479393005373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,balanced,0.10573333501815796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.01,0.13406720161437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.01,0.42255358695983886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,balanced,0.7227679888407389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.01,0.17034239768981935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.01,0.49927678108215334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.01,0.19351680278778077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.01,0.6873727798461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.01,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,balanced,0.7270293235778809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.01,0.30655999183654786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.01,0.9409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,balanced,0.11622400085131328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.01,0.39502720832824706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.01,1.2012031555175782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.01,0.5272640228271485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,balanced,0.1341973344484965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.01,0.7449151992797851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.01,1.7885120391845704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,balanced,0.14995200435320535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.01,1.027731227874756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.01,3.623078536987305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.01,1.2770624160766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.01,1.9327808380126954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,balanced,0.9156959851582845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.01,3.893900680541992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,balanced,0.18872000773747763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,balanced,1.0058133602142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,balanced,0.22105065981547037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,balanced,0.3104106585184733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,power_law_1.01,0.07939839959144593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,power_law_1.01,0.07225599884986877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,power_law_1.01,0.06391680240631104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,balanced,0.391487995783488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,power_law_1.01,0.056428802013397214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,power_law_1.01,0.06500480175018311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,balanced,1.400752067565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,power_law_1.01,0.06812160015106201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,power_law_1.01,0.07370880246162415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,power_law_1.01,0.07329919934272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,power_law_1.01,0.0765824019908905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,32,power_law_1.2,0.12845439910888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,power_law_1.01,0.07783039808273315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,32,power_law_1.2,0.10904959440231324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,power_law_1.01,0.08095359802246094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,32,power_law_1.2,0.07241600155830383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,power_law_1.01,0.08389760255813598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,32,power_law_1.2,0.07115520238876342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,power_law_1.01,0.08521599769592285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,32,power_law_1.2,0.0787775993347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,power_law_1.01,0.08789759874343872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,balanced,0.5761653184890747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,32,power_law_1.2,0.08060160279273987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,power_law_1.01,0.09880959987640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,32,power_law_1.2,0.10109440088272095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,power_law_1.01,0.10502400398254394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,32,power_law_1.2,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,power_law_1.01,0.11804800033569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,32,power_law_1.2,0.09879040122032165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,32,power_law_1.2,0.09586560130119323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,power_law_1.01,0.14204800128936768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,32,power_law_1.2,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,balanced,1.9739093780517578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,32,power_law_1.2,0.10028159618377686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,32,power_law_1.2,0.11044479608535766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,power_law_1.01,0.13868160247802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,balanced,0.7381066481272379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,32,power_law_1.2,0.10882560014724732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,power_law_1.01,0.18474240303039552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,32,power_law_1.2,0.1260800004005432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,32,power_law_1.2,0.13409279584884642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,power_law_1.01,0.21928319931030274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,32,power_law_1.2,0.12981760501861572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,32,power_law_1.2,0.16298240423202515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,32,power_law_1.2,0.16929279565811156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,power_law_1.01,0.30891520977020265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,32,power_law_1.2,0.21972479820251464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,32,power_law_1.2,0.2306879997253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,power_law_1.01,0.40285439491271974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,32,power_law_1.2,0.32965118885040284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,power_law_1.01,0.5582335948944092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,32,power_law_1.2,0.36558079719543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,balanced,2.7291946411132812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,32,power_law_1.2,0.5154560089111329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,power_law_1.01,0.7577727794647217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,32,power_law_1.2,0.07640320062637329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,32,power_law_1.2,0.6070591926574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,32,power_law_1.2,0.9775679588317872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,32,power_law_1.2,0.0758463978767395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,balanced,0.9250666300455729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,32,power_law_1.2,1.3644800186157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,power_law_1.01,1.1297792434692382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,32,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,32,power_law_1.2,1.4208255767822267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,32,power_law_1.2,0.057068800926208495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,power_law_1.01,1.4168959617614747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,32,power_law_1.2,2.4460031509399416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,32,power_law_1.2,0.06282240152359009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,32,power_law_1.2,0.06555520296096802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,power_law_1.01,2.015283203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,32,power_law_1.2,4.790508651733399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,32,power_law_1.2,0.07179520130157471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,power_law_1.01,2.758963203430176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,32,power_law_1.2,0.07624319791793824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,32,power_law_1.2,0.07708160281181335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,power_law_1.01,5.717951965332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,32,power_law_1.2,0.07638400197029113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,32,power_law_1.2,0.08091520071029663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,32,power_law_1.2,0.07971839904785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,32,power_law_1.2,0.08516479730606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,balanced,1.4254345893859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,32,power_law_1.2,0.0893887996673584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,32,power_law_1.2,0.09520000219345093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,32,power_law_1.2,0.1035647988319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,32,power_law_1.2,0.10716160535812377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,32,power_law_1.2,0.1313599944114685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,32,power_law_1.2,0.13731839656829833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,32,power_law_1.2,0.18174079656600953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,32,power_law_1.2,0.2315135955810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,32,power_law_1.2,0.2722368001937866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,32,power_law_1.2,0.3322175979614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,32,power_law_1.2,0.46053118705749513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,32,power_law_1.2,0.6091263771057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,32,power_law_1.2,0.8063936233520508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,32,power_law_1.2,1.141868782043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,32,power_law_1.2,1.4446399688720704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,32,power_law_1.2,0.08072320222854615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,32,power_law_1.2,2.2077823638916017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,32,power_law_1.2,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,32,power_law_1.2,0.048588800430297854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,balanced,0.05537599821885427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,32,power_law_1.2,5.237593460083008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,32,power_law_1.2,0.05947520136833191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,32,power_law_1.2,0.06219519972801209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,balanced,0.05651199817657471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,32,power_law_1.2,0.0646399974822998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,balanced,0.06566933294137318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,32,power_law_1.2,0.07125759720802308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,balanced,0.07667733232180278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,32,power_law_1.2,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,balanced,2.8392906188964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,balanced,0.10752532879511516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,32,power_law_1.2,0.07701119780540466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,balanced,0.10840533177057902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,32,power_law_1.2,0.07722880244255066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,balanced,0.10815999905268352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,32,power_law_1.2,0.08010240197181702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,balanced,0.1086293359597524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,32,power_law_1.2,0.08218880295753479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,balanced,0.1090880036354065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,balanced,0.10947199662526448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,32,power_law_1.2,0.08538240194320679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,balanced,0.11123200257619222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,32,power_law_1.2,0.09152640104293823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,balanced,0.1116426686445872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,32,power_law_1.2,0.10241279602050782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,balanced,0.11429867148399353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,32,power_law_1.2,0.10746239423751831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,balanced,0.11989333232243855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,32,power_law_1.2,0.12603520154953002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,balanced,0.12220266461372375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,balanced,0.12742933630943298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,32,power_law_1.2,0.14384000301361083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,balanced,0.13550933202107748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,balanced,0.14548800388971964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,balanced,0.04779199759165446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,32,power_law_1.2,0.15104000568389891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,balanced,0.164383997519811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,balanced,0.04891733328501383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,32,power_law_1.2,0.19724160432815552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,balanced,0.04868266483147939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,32,power_law_1.2,0.2511039972305298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,balanced,0.17507733901341757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,balanced,0.05301866432030996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,balanced,0.06151466568311056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,balanced,0.0802346666653951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,balanced,0.21317867437998453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,balanced,0.08224000036716461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,32,power_law_1.2,0.38131840229034425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,balanced,0.08206933240095775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,32,power_law_1.2,0.5663296222686768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,balanced,0.08388266960779826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,balanced,0.24699199199676514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,balanced,0.08348799745241801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,32,power_law_1.2,0.6728000164031982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,balanced,0.08533866206804912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,32,power_law_1.2,0.893619155883789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,balanced,0.08604266246159871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,balanced,0.3187626600265503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,balanced,0.08928533395131429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,balanced,0.09053867061932881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,32,power_law_1.2,1.4747648239135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,balanced,0.09714667002360027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,32,power_law_1.2,1.6892992019653321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,balanced,0.09964799880981445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,balanced,0.39274664719899494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,balanced,0.10519466797510783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,balanced,0.1188213328520457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,32,power_law_1.2,2.321638488769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,balanced,0.13313600420951843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,32,power_law_1.2,3.795635223388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,balanced,0.15597333510716757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,32,power_law_1.2,8.127302551269532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,balanced,0.5309546788533529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,balanced,0.17748800913492838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,balanced,0.04580266773700714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,balanced,0.04628799855709076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,balanced,0.2213653326034546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,balanced,0.04737600187460581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.01,0.08551040291786194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,balanced,0.051669334371884666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,balanced,0.06460266808668773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.01,0.11299840211868287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,balanced,0.07826666533946991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,balanced,0.2696266571680705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,balanced,0.08083733419577281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.01,0.06392959952354431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,balanced,0.08133333424727122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.01,0.07084800004959106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,balanced,0.0819893330335617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,balanced,0.684607982635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,balanced,0.08285333216190338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.01,0.06935679912567139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.01,0.07236480116844177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,balanced,0.08428800106048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,balanced,0.3606559832890828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,balanced,0.08644800384839375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.01,0.07963520288467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.01,0.07850239872932434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,balanced,0.08809066812197368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.01,0.05551360249519348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.01,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,balanced,0.08924266695976257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.01,0.05777919888496399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.01,0.09930880069732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,balanced,0.09733333190282185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.01,0.09603840112686157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.01,0.05937280058860779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,balanced,0.4631466468175252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.01,0.10273280143737792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,balanced,0.09754666686058044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.01,0.06811519861221313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.01,0.09971200227737427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,balanced,0.10406933228174846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.01,0.07392640113830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.01,0.10576640367507935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.01,0.10368640422821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.01,0.07371519804000855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,balanced,0.8623572985331217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.01,0.10597120523452759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.01,0.07708799839019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,balanced,0.12065600355466206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.01,0.11996159553527833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.01,0.07811840176582337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.01,0.1270591974258423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.01,0.08227199912071229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,balanced,0.6575946807861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.01,0.0815999984741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.01,0.127948796749115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.01,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.01,0.1456704020500183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.01,0.08926720023155213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.01,0.15869439840316774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.01,0.09807999730110169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,balanced,0.13710400462150574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.01,0.1850111961364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.01,0.10348800420761109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.01,0.11068160533905029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,balanced,0.16241600116093954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.01,0.12880640029907225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.01,0.2685631990432739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.01,0.1410048007965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.01,0.33615999221801757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.01,0.1771456003189087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,balanced,0.8413653373718262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,balanced,0.179584006468455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.01,0.41824002265930177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.01,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.01,0.5373311996459961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.01,0.2642496109008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.01,0.3268224000930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.01,0.7447936058044433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.01,0.450764799118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,balanced,1.2550559838612874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,balanced,0.24420799811681113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.01,0.5954495906829834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.01,1.0088831901550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.01,0.8654463768005372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.01,1.2030464172363282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.01,1.0402432441711427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,balanced,0.30027733246485394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.01,1.8907072067260742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.01,1.3406975746154786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,power_law_1.01,0.06792320013046264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.01,3.5734718322753904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,balanced,1.0626239776611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.01,2.0401279449462892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,power_law_1.01,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,balanced,0.43729066848754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.01,4.184748840332031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,power_law_1.01,0.0546176016330719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,16,power_law_1.2,0.08536319732666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,power_law_1.01,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,power_law_1.01,0.06415359973907471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,16,power_law_1.2,0.10114560127258301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,balanced,0.5421173175175985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,power_law_1.01,0.07117440104484558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,16,power_law_1.2,0.06726400256156921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,power_law_1.01,0.07612800002098083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,16,power_law_1.2,0.06880000233650208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,power_law_1.01,0.07711359858512878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,16,power_law_1.2,0.0742464005947113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,power_law_1.01,0.0769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,power_law_1.01,0.08081279993057251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,16,power_law_1.2,0.07790079712867737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,power_law_1.01,0.08428800106048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,16,power_law_1.2,0.08951680064201355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,16,power_law_1.2,0.09397760033607483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,power_law_1.01,0.08647680282592773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,16,power_law_1.2,0.09470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,power_law_1.01,0.09117439985275269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,16,power_law_1.2,0.09591680169105529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,balanced,1.5931946436564128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,power_law_1.01,0.09637759923934937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,balanced,0.7900586922963461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,16,power_law_1.2,0.10068479776382447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,power_law_1.01,0.10612479448318482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,16,power_law_1.2,0.09975680112838745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,power_law_1.01,0.1131775975227356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,16,power_law_1.2,0.1045375943183899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,power_law_1.01,0.12743680477142333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,16,power_law_1.2,0.11282559633255004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,16,power_law_1.2,0.12264319658279418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,power_law_1.01,0.14890240430831908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,16,power_law_1.2,0.1311360001564026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,balanced,2.417978604634603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,16,power_law_1.2,0.1295359969139099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,balanced,1.0140586694081624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,power_law_1.01,0.16248320341110228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,16,power_law_1.2,0.15457279682159425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,16,power_law_1.2,0.16457600593566896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,power_law_1.01,0.2032639980316162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,power_law_1.01,0.2741503953933716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,16,power_law_1.2,0.21305599212646484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,16,power_law_1.2,0.23719680309295654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,power_law_1.01,0.4095295906066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,16,power_law_1.2,0.28469760417938234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,power_law_1.01,0.5193600177764892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,16,power_law_1.2,0.33880319595336916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,power_law_1.01,0.6442624092102051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,16,power_law_1.2,0.5227392196655274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,power_law_1.01,0.9329983711242675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,16,power_law_1.2,0.6428927898406982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,balanced,1.264346679051717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,power_law_1.01,1.1667263984680176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,16,power_law_1.2,0.9396479606628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,power_law_1.01,1.6504831314086914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,16,power_law_1.2,1.145644760131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,power_law_1.01,2.165798377990723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,16,power_law_1.2,1.485318374633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,power_law_1.01,3.3422657012939454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,16,power_law_1.2,2.509177589416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,power_law_1.01,7.058643341064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,16,power_law_1.2,6.233472061157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,balanced,3.1438185373942056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,16,power_law_1.2,0.06647679805755616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,16,power_law_1.2,0.07271680235862732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,balanced,1.9682614008585613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,16,power_law_1.2,0.05306879878044128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,16,power_law_1.2,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,16,power_law_1.2,0.058899199962615965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,16,power_law_1.2,0.06469759941101075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,16,power_law_1.2,0.07243520021438599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,16,power_law_1.2,0.07491199970245362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,16,power_law_1.2,0.0777728021144867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,16,power_law_1.2,0.07824640274047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,16,power_law_1.2,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,16,power_law_1.2,0.08407679796218873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,16,power_law_1.2,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,16,power_law_1.2,0.09322879910469055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,16,power_law_1.2,0.10046720504760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,16,power_law_1.2,0.10729600191116333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,16,power_law_1.2,0.10951039791107178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,16,power_law_1.2,0.134662401676178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,16,power_law_1.2,0.15273599624633788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,16,power_law_1.2,0.19567999839782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,16,power_law_1.2,0.22272639274597167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,16,power_law_1.2,0.2858112096786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,16,power_law_1.2,0.34858880043029783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,balanced,3.91481081644694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,16,power_law_1.2,0.5132415771484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,16,power_law_1.2,0.6497856140136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,16,power_law_1.2,0.9957056045532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,16,power_law_1.2,0.06493440270423889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,16,power_law_1.2,1.3973119735717774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,16,power_law_1.2,0.08000640273094177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,16,power_law_1.2,1.5174079895019532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,16,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,16,power_law_1.2,2.6511552810668944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,16,power_law_1.2,0.058271998167037965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,balanced,0.05598933498064677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,16,power_law_1.2,0.062483197450637816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,16,power_law_1.2,5.2609600067138675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,balanced,0.05569600065549215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,16,power_law_1.2,0.06649600267410279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,16,power_law_1.2,0.07484800219535828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,balanced,0.057674666245778404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,16,power_law_1.2,0.07824640274047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,balanced,0.06604800124963124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,16,power_law_1.2,0.07978240251541138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,balanced,0.07810666660467784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,16,power_law_1.2,0.08081920146942138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,balanced,0.10956266522407532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,16,power_law_1.2,0.0852735996246338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,balanced,0.1104746659596761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,16,power_law_1.2,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,balanced,0.11282666524251302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,16,power_law_1.2,0.09014400243759155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,16,power_law_1.2,0.10442880392074586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,balanced,0.1132533351580302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,16,power_law_1.2,0.11208959817886352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,balanced,0.11413333813349406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,16,power_law_1.2,0.11794559955596924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,balanced,0.11500266194343567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,16,power_law_1.2,0.13254400491714477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,balanced,0.11620799700419109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,balanced,0.11713600158691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,16,power_law_1.2,0.15624959468841554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,balanced,0.11973866820335388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,balanced,0.12568533420562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,balanced,0.12812266747156778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,balanced,0.0480320006608963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,16,power_law_1.2,0.16728960275650023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,balanced,0.13338667154312134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,balanced,0.04833599925041199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,16,power_law_1.2,0.22945919036865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,balanced,0.1487679978211721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,16,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,balanced,0.050426666935284935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,balanced,0.05495999753475189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,balanced,0.16873600085576376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,16,power_law_1.2,0.440012788772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,balanced,0.06864533325036366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,16,power_law_1.2,0.5803711891174317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,balanced,0.08829866846402486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,balanced,0.18424532810846964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,16,power_law_1.2,0.7616127967834473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,balanced,0.089519997437795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,16,power_law_1.2,0.9478976249694824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,balanced,0.0902239978313446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,balanced,0.21042132377624512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,balanced,0.09119466940561931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,16,power_law_1.2,1.3496640205383301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,balanced,0.09175999959309895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,balanced,0.09364266196886699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,balanced,0.2563839952150981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,16,power_law_1.2,2.0103296279907226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,balanced,0.09363733728726704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,16,power_law_1.2,2.470579147338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,balanced,0.09646933277448018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,balanced,0.09816533327102661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,16,power_law_1.2,4.435424041748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,balanced,0.3078879912694295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,balanced,0.107013334830602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,16,power_law_1.2,9.305439758300782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,balanced,0.10924800237019856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,balanced,0.11602133512496948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,balanced,0.4142666657765706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,balanced,0.1317759950955709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,balanced,0.14938666423161825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,balanced,0.1747466723124186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,balanced,0.5276159842809042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,balanced,0.20270933707555136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.01,0.06683520078659058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.01,0.05415679812431336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,balanced,0.26478399833043414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.01,0.07994880080223084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.01,0.06630399823188782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.01,0.06236799955368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.01,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,balanced,0.3256160020828247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,balanced,0.7392640113830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.01,0.07559040188789368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.01,0.058406400680541995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.01,0.0732096016407013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.01,0.06538879871368408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,balanced,0.0484746644894282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.01,0.0692351996898651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.01,0.0818943977355957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,balanced,0.05091733237107595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,balanced,0.4519146680831909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.01,0.07850880026817322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.01,0.09282559752464295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,balanced,0.05300266544024149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.01,0.08177279829978942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.01,0.08097919821739197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,balanced,0.058415999015172325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.01,0.09649279713630676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.01,0.08128640055656433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,balanced,0.07193600138028462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.01,0.0834879994392395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.01,0.10346239805221558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,balanced,0.09462400277455647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.01,0.08971520066261292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,balanced,0.5820480187733968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,balanced,0.09332799911499023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,balanced,0.9224853515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.01,0.09497600197792053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.01,0.10131839513778687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,balanced,0.09489599863688152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.01,0.10160000324249267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,balanced,0.09571733077367146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.01,0.1047935962677002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,balanced,0.09714133540789287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.01,0.10986239910125732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,balanced,0.0999840001265208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.01,0.11507840156555176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.01,0.10640640258789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,balanced,0.10079466303189595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.01,0.12099839448928833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.01,0.14398720264434814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,balanced,0.1048479974269867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.01,0.11149439811706544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,balanced,0.8386666774749756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.01,0.1548416018486023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,balanced,0.10689600308736165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.01,0.11930240392684936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.01,0.1903167963027954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,balanced,0.11699733138084412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.01,0.13126399517059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.01,0.22773759365081786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,balanced,0.1200320025285085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.01,0.30741760730743406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.01,0.13552000522613525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,balanced,1.1598986784617107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,balanced,0.12783466776212057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.01,0.3921087980270386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.01,0.13948800563812255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.01,0.5511807918548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.01,0.15705599784851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.01,0.6832831859588623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,balanced,0.14891200264294943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.01,0.1769536018371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.01,0.9885824203491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,balanced,1.0533920129140217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.01,0.21381759643554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.01,1.3060992240905762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.01,0.2224639892578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.01,1.526905632019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.01,0.3096127986907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.01,2.584486389160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.01,0.34313600063323973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,balanced,0.17675199111302695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,power_law_1.01,0.061510401964187625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.01,5.396185684204101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.01,0.49458560943603513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,balanced,0.22459733486175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,power_law_1.01,0.07197440266609192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.01,0.6198783874511719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,power_law_1.01,0.05501440167427063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.01,0.9153535842895508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,balanced,0.26265599330266315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,power_law_1.01,0.06289280056953431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,balanced,1.331173340479533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.01,1.247436809539795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,power_law_1.01,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,balanced,1.7147199312845867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,power_law_1.01,0.07822080254554749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.01,1.3956543922424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,8,power_law_1.2,0.06652160286903382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,power_law_1.01,0.08685439825057983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.01,2.3077056884765623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,balanced,0.3722453514734904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,power_law_1.01,0.0883903980255127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,8,power_law_1.2,0.07996159791946411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,power_law_1.01,0.08782079815864563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.01,4.211129760742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,balanced,0.4482453266779582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,power_law_1.01,0.09467520117759705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,8,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,power_law_1.01,0.09872639775276185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,8,power_law_1.2,0.07559679746627808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,power_law_1.01,0.10277760028839111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,power_law_1.01,0.10714880228042603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,balanced,0.6601706743240356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,8,power_law_1.2,0.07048320174217224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,power_law_1.01,0.11444480419158935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,8,power_law_1.2,0.07610880136489868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,power_law_1.01,0.12634880542755128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,8,power_law_1.2,0.09117439985275269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,power_law_1.01,0.1406399965286255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,balanced,2.0170507431030273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,balanced,0.8210453192392985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,8,power_law_1.2,0.09534080028533935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,power_law_1.01,0.15741440057754516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,8,power_law_1.2,0.09313920140266418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,8,power_law_1.2,0.10011520385742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,power_law_1.01,0.18554879426956178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,8,power_law_1.2,0.10440959930419921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,8,power_law_1.2,0.10933120250701904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,balanced,1.205888032913208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,8,power_law_1.2,0.10889600515365601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,power_law_1.01,0.21317119598388673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,power_law_1.01,0.2791935920715332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,8,power_law_1.2,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,power_law_1.01,0.35469439029693606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,8,power_law_1.2,0.13044480085372925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,8,power_law_1.2,0.13528319597244262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,power_law_1.01,0.5073344230651855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,8,power_law_1.2,0.14141440391540527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,8,power_law_1.2,0.16953599452972412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,power_law_1.01,0.5814655780792236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,8,power_law_1.2,0.18773119449615477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,power_law_1.01,0.8876480102539063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,8,power_law_1.2,0.22490239143371582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,power_law_1.01,1.1914560317993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,balanced,1.5808746019999187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,8,power_law_1.2,0.2546367883682251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,power_law_1.01,1.619820785522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,8,power_law_1.2,0.3186944007873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,balanced,3.3354241053263345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,8,power_law_1.2,0.38040320873260497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,power_law_1.01,2.21978874206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,8,power_law_1.2,0.5425920009613037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,8,power_law_1.2,0.7276095867156982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,power_law_1.01,2.638502311706543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,8,power_law_1.2,1.0733183860778808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,8,power_law_1.2,0.053881597518920896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,power_law_1.01,4.36071662902832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,8,power_law_1.2,1.361638355255127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,8,power_law_1.2,0.06609280109405517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,8,power_law_1.2,0.0507968008518219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,8,power_law_1.2,1.714463996887207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,power_law_1.01,9.305894470214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,balanced,1.9669013023376465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,8,power_law_1.2,0.05631359815597534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,8,power_law_1.2,0.06375679969787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,8,power_law_1.2,2.672492790222168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,8,power_law_1.2,0.0670144021511078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,balanced,3.9856961568196616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,8,power_law_1.2,6.293107223510742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,8,power_law_1.2,0.07656319737434387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,8,power_law_1.2,0.08124160170555114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,8,power_law_1.2,0.07923840284347534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,8,power_law_1.2,0.08413439989089966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,8,power_law_1.2,0.0866752028465271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,8,power_law_1.2,0.09089919924736023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,8,power_law_1.2,0.09353600144386291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,8,power_law_1.2,0.10069760084152221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,balanced,3.0843254725138345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,8,power_law_1.2,0.11230720281600952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,8,power_law_1.2,0.11773439645767211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,8,power_law_1.2,0.12318719625473022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,8,power_law_1.2,0.15274879932403565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,8,power_law_1.2,0.16865919828414916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,8,power_law_1.2,0.20015358924865723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,8,power_law_1.2,0.2507456064224243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,8,power_law_1.2,0.3113215923309326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,8,power_law_1.2,0.39969279766082766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,8,power_law_1.2,0.5503424167633056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,8,power_law_1.2,0.740934419631958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,8,power_law_1.2,1.0429632186889648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,8,power_law_1.2,1.427660846710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,8,power_law_1.2,1.8126144409179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,8,power_law_1.2,2.9372671127319334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,8,power_law_1.2,6.329849624633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,8,power_law_1.2,0.061913597583770755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,8,power_law_1.2,0.06869120001792908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,balanced,6.142389297485352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,8,power_law_1.2,0.05556480288505554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,8,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,8,power_law_1.2,0.06968960165977478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,8,power_law_1.2,0.0750976026058197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,8,power_law_1.2,0.08558080196380616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,8,power_law_1.2,0.08836479783058167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,8,power_law_1.2,0.08977919816970825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,balanced,0.055871998270352684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,8,power_law_1.2,0.09413120150566101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,balanced,0.05691199998060862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,8,power_law_1.2,0.09934080243110657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,balanced,0.05904000004132589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,8,power_law_1.2,0.10479999780654907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,balanced,0.08416533470153809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,balanced,0.09640000263849895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,8,power_law_1.2,0.10734720230102539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,balanced,0.1272640029589335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,8,power_law_1.2,0.11786880493164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,balanced,0.12779200077056885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,8,power_law_1.2,0.13127039670944213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,balanced,0.1301866670449575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,8,power_law_1.2,0.13963520526885986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,balanced,0.13056000073750815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,8,power_law_1.2,0.16624640226364135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,balanced,0.131221334139506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,balanced,0.13270399967829385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,8,power_law_1.2,0.1931391954421997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,balanced,0.13619200388590494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,balanced,0.13740799824396768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,balanced,0.1430239975452423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,8,power_law_1.2,0.23502719402313232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,balanced,0.1476479967435201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,balanced,0.15503999590873718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,8,power_law_1.2,0.34072959423065186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,balanced,0.16049599647521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,8,power_law_1.2,0.4048960208892822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,balanced,0.1715466578801473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,balanced,0.04956266780694326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,8,power_law_1.2,0.5121024131774903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,balanced,0.20492800076802573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,balanced,0.051674668987592064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,8,power_law_1.2,0.6676032066345214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,balanced,0.05414933462937673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,balanced,0.23029333353042603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,8,power_law_1.2,1.0821760177612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,balanced,0.060458665092786155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,balanced,0.27349867423375446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,8,power_law_1.2,1.297920036315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,balanced,0.07879466811815898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,balanced,0.10900266965230306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,balanced,0.35092798868815106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,8,power_law_1.2,1.8517759323120118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,balanced,0.11030399799346924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,8,power_law_1.2,2.455353546142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,balanced,0.11071999867757161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,balanced,0.4434826771418254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,balanced,0.1136799951394399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,8,power_law_1.2,3.015519905090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,balanced,0.11286933223406474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,balanced,0.11577600240707397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,8,power_law_1.2,4.687871932983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,balanced,0.11888532837231953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,balanced,0.6155573527018229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,balanced,0.12012799580891927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,balanced,0.12460800011952718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,8,power_law_1.2,10.893580627441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,balanced,0.13154666622479758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,balanced,0.13428800304730734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,balanced,0.7954933643341064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,balanced,0.14203733205795288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.01,0.052985602617263795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.01,0.07864959836006165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,balanced,0.16104533274968466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.01,0.06639999747276307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.01,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.01,0.056601601839065555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,balanced,0.1899413267771403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.01,0.06536319851875305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.01,0.07466239929199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.01,0.07269759774208069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,balanced,0.2306506633758545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,balanced,1.1466506322224934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.01,0.08545920252799988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.01,0.08244479894638061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.01,0.09384959936141968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.01,0.0943615972995758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,balanced,0.25754133860270184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.01,0.09664639830589294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.01,0.11030399799346924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.01,0.09901440143585205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,balanced,0.3490826686223348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.01,0.11409280300140381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.01,0.09906560182571411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.01,0.1150272011756897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.01,0.10535039901733398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.01,0.11734399795532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.01,0.11235840320587158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,balanced,0.4466506640116374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.01,0.12717440128326415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.01,0.11809279918670654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,balanced,1.3547412554423015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.01,0.1322175979614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.01,0.12616959810256959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.01,0.13960319757461548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.01,0.13760000467300415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.01,0.1526528000831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.01,0.1450368046760559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,balanced,0.6321653525034586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.01,0.14935679435729982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.01,0.16343040466308595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.01,0.18558720350265503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.01,0.17199360132217406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.01,0.2028287887573242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.01,0.16150399446487426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.01,0.2671871900558472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.01,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.01,0.30371201038360596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.01,0.20685439109802245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,balanced,0.8234986464182535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.01,0.37918078899383545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.01,0.26569600105285646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.01,0.4887360095977783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,balanced,1.7660266558329265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.01,0.29285759925842286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.01,0.6928256034851075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.01,0.399782395362854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.01,0.9454784393310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.01,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.01,1.3810624122619628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.01,0.6861055850982666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,balanced,1.2087573210398357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.01,1.6379583358764649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.01,0.9062272071838379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.01,2.079232025146484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.01,1.3502592086791991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.01,1.6909503936767578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.01,3.4573631286621094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.01,1.8965824127197266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.01,7.141184234619141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.01,3.045907211303711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.01,6.807974243164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,balanced,1.4789387385050456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,balanced,2.597930590311686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,4,power_law_1.2,0.05883520245552063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,4,power_law_1.2,0.07467520236968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,4,power_law_1.2,0.061337602138519284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,4,power_law_1.2,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,4,power_law_1.2,0.0814848005771637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,balanced,1.9015572865804036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,4,power_law_1.2,0.09408640265464782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,4,power_law_1.2,0.10661120414733886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,4,power_law_1.2,0.11101440191268921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,4,power_law_1.2,0.11344000101089477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,4,power_law_1.2,0.1202623963356018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,4,power_law_1.2,0.12845439910888673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,4,power_law_1.2,0.13463040590286254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,4,power_law_1.2,0.1373568058013916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,4,power_law_1.2,0.15660159587860106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,4,power_law_1.2,0.16398719549179078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,4,power_law_1.2,0.17457280158996583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,4,power_law_1.2,0.1673792004585266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,4,power_law_1.2,0.21242880821228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,balanced,2.9024054209391275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,4,power_law_1.2,0.21902079582214357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,4,power_law_1.2,0.27299840450286866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,4,power_law_1.2,0.31223039627075194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,4,power_law_1.2,0.41690878868103026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,balanced,5.126330693562825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,4,power_law_1.2,0.5283135890960693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,4,power_law_1.2,0.7259967803955079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,4,power_law_1.2,0.9878720283508301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,4,power_law_1.2,1.2808128356933595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,4,power_law_1.2,1.7433792114257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,4,power_law_1.2,2.072211265563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,4,power_law_1.2,3.7837055206298826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,4,power_law_1.2,7.394207763671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,4,power_law_1.2,0.05361279845237732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,4,power_law_1.2,0.06646400094032287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,4,power_law_1.2,0.05371519923210144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,4,power_law_1.2,0.06320639848709106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,4,power_law_1.2,0.07219200134277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,4,power_law_1.2,0.07813119888305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,4,power_law_1.2,0.09168000221252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,4,power_law_1.2,0.09450240135192871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,balanced,5.768138885498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,4,power_law_1.2,0.097324800491333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,4,power_law_1.2,0.09916160106658936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,4,power_law_1.2,0.107750403881073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,4,power_law_1.2,0.11184639930725097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,4,power_law_1.2,0.11880960464477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,4,power_law_1.2,0.12807040214538573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,4,power_law_1.2,0.13626879453659058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,4,power_law_1.2,0.1519744038581848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,4,power_law_1.2,0.15289599895477296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,4,power_law_1.2,0.1898751974105835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,4,power_law_1.2,0.21599359512329103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,4,power_law_1.2,0.26757121086120605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,4,power_law_1.2,0.30598399639129636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,4,power_law_1.2,0.41571841239929197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,4,power_law_1.2,0.5002560138702392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,4,power_law_1.2,0.7393663883209228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,4,power_law_1.2,0.9939007759094238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,balanced,0.03832533210515976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,4,power_law_1.2,1.404524803161621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,balanced,0.038906666139761605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,4,power_law_1.2,1.9417280197143554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,balanced,0.041008000572522484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,4,power_law_1.2,2.381920051574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,balanced,0.040709334115187325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,balanced,0.04167999823888143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,4,power_law_1.2,3.9424766540527343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,balanced,0.04399999976158142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,balanced,0.04663999875386556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,balanced,0.037104000647862755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,balanced,0.044293334086736046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,4,power_law_1.2,8.18572769165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,balanced,0.04478399952252706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,balanced,0.036303999523321785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,balanced,0.04234666625658671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,balanced,0.041877334316571556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,balanced,0.03734933336575826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,balanced,0.04211199780305227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,balanced,0.03893866638342539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,balanced,0.044154668847719826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,balanced,0.047797332207361855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,balanced,0.03818666686614355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,balanced,0.04818133513132731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,balanced,0.039674667020638786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,balanced,0.0472320020198822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,balanced,0.04057066639264425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,balanced,0.0462719996770223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,balanced,0.04021333406368891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,balanced,0.047151997685432434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,balanced,0.03965333352486292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,balanced,0.045466666420300804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,balanced,0.04078399886687597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,balanced,0.04417066772778829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,balanced,0.0395359992980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,balanced,0.04019733270009359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,balanced,0.04121600091457367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,balanced,0.06157866617043813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,balanced,0.04132800052563349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,balanced,0.04472533365090688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,balanced,0.061349332332611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,balanced,0.04321600000063578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,balanced,0.0432640016078949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,balanced,0.04492799937725067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,balanced,0.07816533247629802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,balanced,0.023024000227451324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,balanced,0.046021332343419395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,balanced,0.023050665855407715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,balanced,0.04881600042184194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,balanced,0.02496533344189326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,balanced,0.02492800106604894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,balanced,0.02621866762638092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,balanced,0.05063466727733612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,balanced,0.026543999711672466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,balanced,0.08959999680519104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,balanced,0.02641066660483678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,balanced,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,balanced,0.026357332865397137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,power_law_1.01,0.03783040046691895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,balanced,0.02701333413521449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,balanced,0.027509334186712902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,balanced,0.027610667049884796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,power_law_1.01,0.037811198830604555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,balanced,0.07987200220425923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,balanced,0.028389332195123036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,power_law_1.01,0.039801600575447085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,balanced,0.028538666665554047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,balanced,0.12198399504025777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,balanced,0.031045332551002502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,power_law_1.01,0.04099839925765991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,power_law_1.01,0.0438400000333786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,balanced,0.030581332743167877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,balanced,0.10219200452168782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,power_law_1.01,0.04305280148983002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,power_law_1.01,0.043647998571395875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,power_law_1.01,0.0430400013923645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,power_law_1.01,0.042131200432777405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,balanced,0.03164800008138021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,power_law_1.01,0.039155200123786926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,power_law_1.01,0.03943040072917938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,balanced,0.12124799688657124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,balanced,0.033359999457995095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,power_law_1.01,0.04028800129890442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,balanced,0.032111999889214836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,balanced,0.14869333306948343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,power_law_1.01,0.03951359987258911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,power_law_1.01,0.048851200938224794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,power_law_1.01,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,power_law_1.01,0.06149119734764099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,power_law_1.01,0.034560000896453856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,power_law_1.01,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,balanced,0.1644480029741923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,balanced,0.037477334340413414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,power_law_1.01,0.03455359935760498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,power_law_1.01,0.08958719968795777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,power_law_1.01,0.0350847989320755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,balanced,0.03736533224582672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,power_law_1.01,0.10002559423446655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,power_law_1.01,0.03681280016899109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,power_law_1.01,0.1244096040725708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,power_law_1.01,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,power_law_1.01,0.16843520402908324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,power_law_1.01,0.25119359493255616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,power_law_1.01,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,balanced,0.18107734123865762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,power_law_1.01,0.3293951988220215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,power_law_1.01,0.03797119855880737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,balanced,0.04399999976158142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,power_law_1.01,0.4841599941253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,power_law_1.01,0.03790720105171204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,balanced,0.20423465967178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,power_law_1.01,0.03707520067691803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,power_law_1.01,0.6223231792449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,balanced,0.049914668003718056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,power_law_1.01,0.038924801349639895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,power_law_1.01,0.8347328186035157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,power_law_1.01,0.02285439968109131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,power_law_1.01,0.03898240029811859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,power_law_1.01,1.4632384300231933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,power_law_1.01,0.03777279853820801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,power_law_1.01,0.022950400412082673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,power_law_1.01,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,power_law_1.01,3.4216766357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,power_law_1.01,0.022995199263095855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,power_law_1.01,0.038726401329040525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,power_law_1.01,0.025139200687408447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,power_law_1.01,0.03937920033931732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,power_law_1.01,0.025209599733352663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,power_law_1.01,0.04472959935665131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,balanced,0.060933331648508705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,power_law_1.01,0.026240000128746034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,balanced,0.24739732344945273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,power_law_1.01,0.02630400061607361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,power_law_1.01,0.026399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,power_law_1.01,0.05381760001182556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,balanced,0.266704003016154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,power_law_1.01,0.02632960081100464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,power_law_1.01,0.05807999968528747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,power_law_1.01,0.026688000559806822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,power_law_1.01,0.07505279779434204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,power_law_1.01,0.02725760042667389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,power_law_1.01,0.08885759711265565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,power_law_1.01,0.027628800272941588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,power_law_1.01,0.11347839832305909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,balanced,0.0718560020128886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,power_law_1.01,0.02794240117073059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,power_law_1.01,0.15192320346832275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,power_law_1.01,0.0293503999710083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,power_law_1.01,0.03222399950027466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,power_law_1.01,0.20612480640411376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,power_law_1.01,0.03409920036792755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,power_law_1.01,0.2862720012664795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,power_law_1.01,0.40166401863098145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,power_law_1.01,0.5527743816375732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,power_law_1.01,0.04289920032024384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,power_law_1.01,0.6589503765106202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,power_law_1.01,0.05066879987716675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,balanced,0.3726026614507039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,power_law_1.01,0.06213759779930115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,power_law_1.01,1.1479807853698731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,balanced,0.09477333227793376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,power_law_1.01,0.0642687976360321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,power_law_1.01,2.4738304138183596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,power_law_1.01,0.084934401512146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,1,128,power_law_1.2,0.03948160111904144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,power_law_1.01,0.09159039855003356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,power_law_1.01,0.1310271978378296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,1,128,power_law_1.2,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,1,128,power_law_1.2,0.04208639860153198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,1,128,power_law_1.2,0.03407360017299652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,power_law_1.01,0.1617408037185669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,1,128,power_law_1.2,0.04245119988918304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,1,128,power_law_1.2,0.03402239978313446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,1,128,power_law_1.2,0.04242559969425201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,1,128,power_law_1.2,0.033452799916267394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,balanced,0.11638399958610535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,1,128,power_law_1.2,0.036051198840141296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,1,128,power_law_1.2,0.043315199017524716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,power_law_1.01,0.2027967929840088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,balanced,0.5036106506983439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,1,128,power_law_1.2,0.042668798565864564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,1,128,power_law_1.2,0.035776001214981076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,1,128,power_law_1.2,0.04259200096130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,1,128,power_law_1.2,0.03720960021018982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,1,128,power_law_1.2,0.0427264004945755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,1,128,power_law_1.2,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,power_law_1.01,0.3124351978302002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,1,128,power_law_1.2,0.03854719996452331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,1,128,power_law_1.2,0.04221439957618713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,1,128,power_law_1.2,0.03811199963092804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,1,128,power_law_1.2,0.04016000032424927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,power_law_1.01,0.41724162101745604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,1,128,power_law_1.2,0.03871999979019165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,1,128,power_law_1.2,0.04041599929332733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,1,128,power_law_1.2,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,1,128,power_law_1.2,0.03982079923152924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,1,128,power_law_1.2,0.038873600959777835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,1,128,power_law_1.2,0.04088320136070252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,1,128,power_law_1.2,0.03852159976959228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,1,128,power_law_1.2,0.048767998814582825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,1,128,power_law_1.2,0.041254401206970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,1,128,power_law_1.2,0.052211201190948485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,balanced,0.706175963083903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,1,128,power_law_1.2,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,balanced,0.13847466309865317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,power_law_1.01,0.526035213470459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,1,128,power_law_1.2,0.055871999263763426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,1,128,power_law_1.2,0.04575360119342804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,power_law_1.01,0.8825663566589356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,1,128,power_law_1.2,0.06654719710350036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,1,128,power_law_1.2,0.05173119902610779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,1,128,power_law_1.2,0.07776640057563781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,1,128,power_law_1.2,0.05756160020828247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,power_law_1.01,1.6599744796752929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,1,128,power_law_1.2,0.0691968023777008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,1,128,power_law_1.2,0.10011520385742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,1,128,power_law_1.2,0.07988479733467102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,1,128,power_law_1.2,0.13201919794082642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,1,128,power_law_1.2,0.1093440055847168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,1,128,power_law_1.2,0.20010240077972413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,1,128,power_law_1.2,0.15935360193252562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,1,128,power_law_1.2,0.2710400104522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,1,128,power_law_1.2,0.19267840385437013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,1,128,power_law_1.2,0.35567359924316405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,1,128,power_law_1.2,0.28942720890045165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,1,128,power_law_1.2,0.49097599983215334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,1,128,power_law_1.2,0.3831935882568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,1,128,power_law_1.2,0.8011136054992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,1,128,power_law_1.2,0.5658304214477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,balanced,0.20567999283472696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,1,128,power_law_1.2,1.0651647567749023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,1,128,power_law_1.2,0.7517439842224121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,1,128,power_law_1.2,1.4032064437866212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,1,128,power_law_1.2,0.9766271591186524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,1,128,power_law_1.2,2.4038015365600587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,1,128,power_law_1.2,1.5360639572143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,1,128,power_law_1.2,4.9422657012939455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,1,128,power_law_1.2,3.095974349975586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,1,128,power_law_1.2,0.0225600004196167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,1,128,power_law_1.2,0.022867199778556824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,1,128,power_law_1.2,0.02279040068387985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,1,128,power_law_1.2,0.02456959933042526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,balanced,0.38461331526438397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,1,128,power_law_1.2,0.024851199984550477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,1,128,power_law_1.2,0.02598400115966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,1,128,power_law_1.2,0.02600319981575012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,1,128,power_law_1.2,0.026335999369621277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,1,128,power_law_1.2,0.02648319900035858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,1,128,power_law_1.2,0.0265855997800827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,1,128,power_law_1.2,0.027244800329208375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,1,128,power_law_1.2,0.028300800919532777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,1,128,power_law_1.2,0.028678399324417115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,1,128,power_law_1.2,0.030419200658798218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,1,128,power_law_1.2,0.03466239869594574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,1,128,power_law_1.2,0.03731200098991394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,1,128,power_law_1.2,0.04867199957370758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,1,128,power_law_1.2,0.061388802528381345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,balanced,0.022805333137512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,1,128,power_law_1.2,0.08028799891471863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,balanced,0.026538667579491932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,1,128,power_law_1.2,0.09186559915542603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,balanced,0.022656001150608063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,1,128,power_law_1.2,0.1071936011314392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,balanced,0.02402666707833608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,balanced,0.0249439999461174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,balanced,0.025818665822347004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,balanced,0.025418666501839954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,1,128,power_law_1.2,0.14247039556503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,balanced,0.025786665578683216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,1,128,power_law_1.2,0.19467519521713256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,balanced,0.026213333010673523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,balanced,0.030960001051425934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,balanced,0.026341333985328674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,balanced,0.026687999566396076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,balanced,0.029018667836983997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,1,128,power_law_1.2,0.2653439998626709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,balanced,0.026767998933792114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,balanced,0.029120000700155895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,balanced,0.02759466568628947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,balanced,0.03173333406448364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,1,128,power_law_1.2,0.31850879192352294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,balanced,0.034346667428811394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,balanced,0.033600000043710075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,balanced,0.03618666778008143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,balanced,0.03369066615899404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,1,128,power_law_1.2,0.49881601333618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,balanced,0.036144000788529716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,balanced,0.03411199897527695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,balanced,0.039733332892258964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,1,128,power_law_1.2,0.6492735862731933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,balanced,0.03408533334732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,balanced,0.03865066667397817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,balanced,0.03454933315515518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,balanced,0.03488533447186152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,1,128,power_law_1.2,0.791596794128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,balanced,0.03565333286921183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,balanced,0.04254400233427683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,1,128,power_law_1.2,1.2614272117614747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,balanced,0.036858665446440377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,balanced,0.04287466903527578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,1,128,power_law_1.2,2.456051254272461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,balanced,0.03872533390919367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,balanced,0.03810133288304011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,balanced,0.05023466547330221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,power_law_1.01,0.02260479927062988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,balanced,0.0397119993964831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,power_law_1.01,0.025721600651741026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,balanced,0.0401653324564298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,balanced,0.04957866668701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,power_law_1.01,0.02215680032968521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,balanced,0.04144533226887385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,power_law_1.01,0.023443199694156647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,balanced,0.044821331898371376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,balanced,0.06463466584682465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,power_law_1.01,0.024940800666809083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,balanced,0.047541335225105286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,balanced,0.02332266668478648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,power_law_1.01,0.025248000025749208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,balanced,0.02319466571013133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,balanced,0.0645653357108434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,power_law_1.01,0.025536000728607178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,balanced,0.02329600105683009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,balanced,0.025306666890780132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,power_law_1.01,0.029651200771331786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,balanced,0.06622399886449178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,balanced,0.025519999365011852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,power_law_1.01,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,balanced,0.026837334036827087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,balanced,0.0713919997215271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,power_law_1.01,0.03160319924354553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,balanced,0.027093333502610523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,power_law_1.01,0.03210879862308502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,balanced,0.026575999955336254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,power_law_1.01,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,balanced,0.026848000784715016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,balanced,0.02769600103298823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,power_law_1.01,0.037376001477241516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,balanced,0.08985066413879395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,balanced,0.027834666272004444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,power_law_1.01,0.03803519904613495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,balanced,0.08561066786448161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,balanced,0.02794666588306427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,power_law_1.01,0.04097920060157776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,balanced,0.028751999139785767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,power_law_1.01,0.04286719858646393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,balanced,0.02917333443959554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,power_law_1.01,0.05110399723052979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,balanced,0.03176533430814743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,power_law_1.01,0.06867200136184692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,balanced,0.10409067074457805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,power_law_1.01,0.07668480277061462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,balanced,0.031125334401925404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,power_law_1.01,0.0908352017402649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,power_law_1.01,0.11101440191268921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,power_law_1.01,0.14924800395965576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,balanced,0.09523199995358785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,power_law_1.01,0.20955519676208495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,balanced,0.03190933416287104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,power_law_1.01,0.03155199885368347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,power_law_1.01,0.22940800189971924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,balanced,0.034416000048319496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,power_law_1.01,0.02943359911441803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,balanced,0.13952533404032388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,power_law_1.01,0.35019519329071047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,power_law_1.01,0.029382398724555968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,power_law_1.01,0.02282879948616028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,power_law_1.01,0.5246335983276367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,balanced,0.033301333586374916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,power_law_1.01,0.03193599879741669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,power_law_1.01,0.022444799542427063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,power_law_1.01,0.9798591613769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,power_law_1.01,0.03345920145511627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,power_law_1.01,0.02481919974088669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,power_law_1.01,0.033055999875068666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,power_law_1.01,0.025574401021003723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,balanced,0.038933334251244865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,power_law_1.01,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,power_law_1.01,0.02630400061607361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,balanced,0.11122133334477742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,balanced,0.16742400328318277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,power_law_1.01,0.02661119997501373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,power_law_1.01,0.034016001224517825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,balanced,0.03958933303753535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,power_law_1.01,0.02693760097026825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,power_law_1.01,0.033990401029586795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,power_law_1.01,0.027014398574829103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,power_law_1.01,0.03573760092258453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,power_law_1.01,0.02725760042667389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,power_law_1.01,0.03537920117378235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,power_law_1.01,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,power_law_1.01,0.027807998657226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,64,power_law_1.2,0.022892799973487855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,power_law_1.01,0.0377344012260437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,power_law_1.01,0.028832000494003297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,balanced,0.04706666866938273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,64,power_law_1.2,0.02588160037994385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,power_law_1.01,0.04036479890346527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,power_law_1.01,0.02892799973487854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,64,power_law_1.2,0.022195200622081756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,power_law_1.01,0.04089600145816803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,64,power_law_1.2,0.02366719990968704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,power_law_1.01,0.03061760067939758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,balanced,0.054474666714668274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,balanced,0.19963733355204263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,power_law_1.01,0.04227840006351471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,64,power_law_1.2,0.024563199281692503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,power_law_1.01,0.033881598711013795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,64,power_law_1.2,0.025407999753952026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,power_law_1.01,0.047193598747253415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,power_law_1.01,0.03490560054779053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,64,power_law_1.2,0.02510719895362854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,power_law_1.01,0.048307201266288756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,64,power_law_1.2,0.029452800750732422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,power_law_1.01,0.05797119736671448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,64,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,power_law_1.01,0.0418368011713028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,64,power_law_1.2,0.031123200058937074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,power_law_1.01,0.06892799735069274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,balanced,0.15752533078193665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,64,power_law_1.2,0.03234559893608093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,power_law_1.01,0.04799999892711639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,power_law_1.01,0.09415680170059204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,64,power_law_1.2,0.032678401470184325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,balanced,0.06903466582298279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,64,power_law_1.2,0.03356800079345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,power_law_1.01,0.1074560046195984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,64,power_law_1.2,0.036473599076271054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,power_law_1.01,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,64,power_law_1.2,0.0385919988155365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,power_law_1.01,0.17333120107650757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,power_law_1.01,0.05917440056800842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,64,power_law_1.2,0.038924801349639895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,64,power_law_1.2,0.042419201135635375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,power_law_1.01,0.2571455955505371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,power_law_1.01,0.07088639736175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,64,power_law_1.2,0.04699519872665405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,64,power_law_1.2,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,power_law_1.01,0.28606719970703126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,64,power_law_1.2,0.07726719975471497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,power_law_1.01,0.3448512077331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,balanced,0.08179733157157898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,power_law_1.01,0.09466879963874816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,64,power_law_1.2,0.08967679738998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,balanced,0.29368533690770465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,64,power_law_1.2,0.12243839502334594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,power_law_1.01,0.598195219039917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,power_law_1.01,0.11943039894104004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,64,power_law_1.2,0.1366912007331848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,64,power_law_1.2,0.17017600536346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,power_law_1.01,1.2960831642150878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,64,power_law_1.2,0.23456640243530275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,power_law_1.01,0.16005120277404786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,64,power_law_1.2,0.336844801902771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,64,power_law_1.2,0.41295361518859863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,64,power_law_1.2,0.4887104034423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,power_law_1.01,0.22403199672698976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,64,power_law_1.2,0.8697407722473145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,balanced,0.11016533772150676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,power_law_1.01,0.33773438930511473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,power_law_1.2,2.251942443847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,power_law_1.01,0.42005119323730467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,balanced,0.1355893313884735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,power_law_1.01,0.46827521324157717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,64,balanced,0.2773759961128235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,power_law_1.01,0.8288448333740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,power_law_1.01,1.4551615715026855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,64,power_law_1.2,0.03182080090045929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,64,power_law_1.2,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,64,power_law_1.2,0.029600000381469725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,64,power_law_1.2,0.03224959969520569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,balanced,0.16197866201400757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,balanced,0.543994665145874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,64,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,64,power_law_1.2,0.033215999603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,64,power_law_1.2,0.0333759993314743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,64,power_law_1.2,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,64,power_law_1.2,0.03418239951133728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,64,power_law_1.2,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,64,power_law_1.2,0.03506560027599335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,64,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,64,power_law_1.2,0.03601279854774475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,64,power_law_1.2,0.037920001149177554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,64,power_law_1.2,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,balanced,0.24247467517852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,64,power_law_1.2,0.04127359986305237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,64,power_law_1.2,0.04407039880752563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,64,power_law_1.2,0.0495743989944458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,64,power_law_1.2,0.05127040147781372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,64,power_law_1.2,0.06519039869308471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,64,power_law_1.2,0.08297600150108338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,64,power_law_1.2,0.11682560443878173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,64,power_law_1.2,0.12183040380477905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,64,power_law_1.2,0.19212160110473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,64,power_law_1.2,0.25829119682312013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,64,power_law_1.2,0.33870720863342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,64,power_law_1.2,0.022899200022220612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,64,power_law_1.2,0.4041920185089111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,64,power_law_1.2,0.02268799990415573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,64,power_law_1.2,0.5707071781158447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,64,power_law_1.2,0.022726400196552275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,64,power_law_1.2,0.9499711990356445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,64,power_law_1.2,0.024748800694942473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,64,power_law_1.2,0.025235199928283693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,64,power_law_1.2,2.2013248443603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,64,power_law_1.2,0.02659200131893158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,64,power_law_1.2,0.026822400093078614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,64,power_law_1.2,0.027008000016212463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,64,power_law_1.2,0.027020800113677978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,64,power_law_1.2,0.027539199590682982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,64,power_law_1.2,0.028288000822067262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,64,power_law_1.2,0.028966400027275085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,balanced,0.4845866759618123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,64,power_law_1.2,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,64,power_law_1.2,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,64,power_law_1.2,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,64,power_law_1.2,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,64,power_law_1.2,0.04351359903812409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,64,power_law_1.2,0.05185920000076294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,64,power_law_1.2,0.05998079776763916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,64,power_law_1.2,0.07905920147895813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,64,power_law_1.2,0.10065280199050904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,balanced,0.023919999599456787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,64,power_law_1.2,0.12729599475860595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,balanced,0.021962667504946392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,64,power_law_1.2,0.17411839962005615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,balanced,0.022005334496498108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,balanced,0.02348266790310542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,balanced,0.02421333392461141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,64,power_law_1.2,0.23347198963165283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,balanced,0.025055999557177227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,balanced,0.024847999215126038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,balanced,0.02502399931351344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,64,power_law_1.2,0.32510080337524416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,balanced,0.025706666211287182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,balanced,0.0301706666747729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,balanced,0.025642665723959606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,64,power_law_1.2,0.42517762184143065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,balanced,0.028880000114440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,balanced,0.02611733227968216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,balanced,0.028858666618665058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,balanced,0.026154667139053345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,64,power_law_1.2,0.7414847850799561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,balanced,0.03169599920511246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,balanced,0.02664000044266383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,balanced,0.033914667864640556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,64,power_law_1.2,0.9062848091125488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,balanced,0.03438399980465571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,balanced,0.03562133262554804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,64,power_law_1.2,1.2898495674133301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,balanced,0.03485333422819773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,balanced,0.03561066587766012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,64,power_law_1.2,3.3605823516845703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,balanced,0.03531199942032496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,balanced,0.03993066648642222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,balanced,0.033957332372665405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,balanced,0.03456533451875051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,balanced,0.040218666195869446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,balanced,0.035386666655540466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,balanced,0.04046933352947235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,balanced,0.036330667634805046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,balanced,0.03603200117746989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,balanced,0.041189332803090416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,balanced,0.023157333334287006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,balanced,0.037578667203585304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,balanced,0.022853332261244457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,balanced,0.04452266792456309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,balanced,0.03910933434963226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,balanced,0.023103999594847362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,power_law_1.01,0.02462079972028732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,balanced,0.03886933376391729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,balanced,0.025360000630219776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,power_law_1.01,0.03394559919834137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,balanced,0.05331199864546458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,balanced,0.02571200082699458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,power_law_1.01,0.021875199675559998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,balanced,0.041077333192030586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,power_law_1.01,0.031839999556541446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,balanced,0.02712533374627431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,power_law_1.01,0.021478399634361267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,balanced,0.04134399940570196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,power_law_1.01,0.029728001356124877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,balanced,0.027610667049884796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,power_law_1.01,0.023014399409294128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,balanced,0.05516799787680308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,power_law_1.01,0.03180800080299377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,balanced,0.027072000006834667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,balanced,0.042352000872294106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,power_law_1.01,0.03214719891548157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,power_law_1.01,0.02374400049448013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,balanced,0.027280000348885853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,power_law_1.01,0.033632001280784606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,balanced,0.02805333336194356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,balanced,0.04796266555786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,power_law_1.01,0.024409599602222443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,power_law_1.01,0.03362559974193573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,balanced,0.028389332195123036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,power_law_1.01,0.034860798716545106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,power_law_1.01,0.02454400062561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,balanced,0.0688266654809316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,power_law_1.01,0.03357439935207367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,balanced,0.05051200091838837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,balanced,0.02855466554562251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,power_law_1.01,0.02467840015888214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,power_law_1.01,0.03356159925460815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,balanced,0.029114666084448498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,power_law_1.01,0.029049599170684816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,power_law_1.01,0.034860798716545106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,balanced,0.02961066613594691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,balanced,0.06714666883150737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,power_law_1.01,0.035180801153182985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,power_law_1.01,0.030188798904418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,balanced,0.03279466678698858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,power_law_1.01,0.037241598963737486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,power_law_1.01,0.033369600772857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,balanced,0.07212266822655995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,balanced,0.03230399886767069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,power_law_1.01,0.03889279961585999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,power_law_1.01,0.035123199224472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,balanced,0.0766186664501826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,power_law_1.01,0.04063999950885773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,power_law_1.01,0.03694719970226288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,power_law_1.01,0.041247999668121337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,power_law_1.01,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,power_law_1.01,0.043808001279830935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,power_law_1.01,0.03917439877986908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,power_law_1.01,0.04782080054283142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,power_law_1.01,0.03806079924106598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,balanced,0.03359466542800268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,balanced,0.09717333316802979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,power_law_1.01,0.04991999864578247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,power_law_1.01,0.042028799653053284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,balanced,0.0979306697845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,power_law_1.01,0.04447360038757324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,power_law_1.01,0.058950400352478026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,balanced,0.036389333506425224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,power_law_1.01,0.06875519752502442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,power_law_1.01,0.051641601324081424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,balanced,0.03570133447647095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,power_law_1.01,0.09552000164985656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,power_law_1.01,0.058822399377822875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,power_law_1.01,0.10582400560379028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,power_law_1.01,0.06195840239524841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,balanced,0.11309333642323811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,power_law_1.01,0.14366079568862916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,power_law_1.01,0.08494719862937927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,power_law_1.01,0.18481279611587526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,power_law_1.01,0.08318719863891602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,power_law_1.01,0.2790080070495605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,power_law_1.01,0.11178879737854004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,balanced,0.04206933577855428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,power_law_1.01,0.29678080081939695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,power_law_1.01,0.12918399572372435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,power_law_1.01,0.40032000541687013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,balanced,0.11312533418337505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,power_law_1.01,0.1804095983505249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,balanced,0.04373333354791006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,power_law_1.01,0.6503488063812256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,power_law_1.01,0.23875839710235597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,balanced,0.15428266922632852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,power_law_1.01,1.3249664306640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,power_law_1.01,0.33113598823547363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,power_law_1.01,0.5011136054992675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,balanced,0.053957333167394005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,power_law_1.01,0.9601728439331054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,balanced,0.06404800216356914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,power_law_1.01,0.024383999407291412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,balanced,0.18854933977127075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,balanced,0.13135466972986856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,power_law_1.01,0.02316800057888031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,power_law_1.01,0.02322559952735901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,32,power_law_1.2,0.024505600333213806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,power_law_1.01,0.02529279887676239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,32,power_law_1.2,0.021792000532150267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,power_law_1.01,0.025887998938560485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,balanced,0.08205333352088928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,32,power_law_1.2,0.021817600727081297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,power_law_1.01,0.027167999744415285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,32,power_law_1.2,0.023212799429893495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,power_law_1.01,0.027404800057411194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,32,power_law_1.2,0.023769600689411162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,power_law_1.01,0.027270400524139406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,32,power_law_1.2,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,32,power_law_1.2,0.024607999622821806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,balanced,0.22618132829666138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,power_law_1.01,0.027456000447273254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,32,power_law_1.2,0.026892799139022826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,32,power_law_1.2,0.030752000212669373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,power_law_1.01,0.02810240089893341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,balanced,0.10166933139165242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,32,power_law_1.2,0.03089280128479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,power_law_1.01,0.02847360074520111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,32,power_law_1.2,0.034969601035118106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,power_law_1.01,0.031001600623130798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,32,power_law_1.2,0.03861759901046753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,balanced,0.1954560081164042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,32,power_law_1.2,0.04206719994544983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,power_law_1.01,0.03108479976654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,power_law_1.01,0.03244799971580505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,32,power_law_1.2,0.03699840009212494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,power_law_1.01,0.03552640080451965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,32,power_law_1.2,0.039647999405860904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,power_law_1.01,0.03668479919433594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,32,power_law_1.2,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,32,power_law_1.2,0.04380159974098206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,32,power_law_1.2,0.04713599979877472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,balanced,0.13889066378275552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,32,power_law_1.2,0.05354239940643311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,power_law_1.01,0.039980798959732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,32,power_law_1.2,0.0667136013507843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,power_law_1.01,0.048441600799560544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,32,power_law_1.2,0.07194240093231201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,power_law_1.01,0.05504639744758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,32,power_law_1.2,0.08912000060081482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,balanced,0.338922659556071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,32,power_law_1.2,0.10154880285263061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,32,power_law_1.2,0.15267839431762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,power_law_1.01,0.06224640011787415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,32,power_law_1.2,0.17330559492111205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,power_law_1.01,0.08565760254859925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,32,power_law_1.2,0.2849152088165283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,power_law_1.01,0.10295039415359497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,32,power_law_1.2,0.34073600769042967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,power_law_1.01,0.11882879734039306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,32,power_law_1.2,0.48764801025390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,balanced,0.17312532663345337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,32,power_law_1.2,0.8796416282653808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,power_law_1.01,0.18610559701919555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,power_law_1.2,1.8662847518920898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,32,power_law_1.2,0.03273600041866302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,power_law_1.01,0.2867392063140869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,32,power_law_1.2,0.029235199093818665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,32,power_law_1.2,0.02933120131492615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,power_law_1.01,0.33019518852233887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,32,power_law_1.2,0.03157120048999786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,32,power_law_1.2,0.03206399977207184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,32,power_law_1.2,0.0331712007522583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,power_law_1.01,0.43920001983642576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,32,power_law_1.2,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,balanced,0.21358400583267212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,power_law_1.01,0.5301439762115479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,32,power_law_1.2,0.034483200311660765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,32,power_law_1.2,0.03351680040359497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,power_law_1.01,0.9817855834960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,32,balanced,0.35089067618052167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,32,power_law_1.2,0.03351039886474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,32,power_law_1.2,0.035417601466178894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,power_law_1.01,1.8624191284179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,32,power_law_1.2,0.0358271986246109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,32,power_law_1.2,0.03699199855327606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,32,power_law_1.2,0.03818239867687225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,32,power_law_1.2,0.04118399918079376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,32,power_law_1.2,0.04258559942245484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,32,power_law_1.2,0.04590719938278198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,32,power_law_1.2,0.050348800420761106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,32,power_law_1.2,0.05746560096740723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,balanced,0.6376853386561075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,32,power_law_1.2,0.06275200247764587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,32,power_law_1.2,0.07841920256614685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,balanced,0.3463573455810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,32,power_law_1.2,0.10759680271148682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,32,power_law_1.2,0.12565120458602905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,32,power_law_1.2,0.19209599494934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,32,power_law_1.2,0.20516479015350342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,32,power_law_1.2,0.35910398960113527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,32,power_law_1.2,0.38416640758514403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,32,power_law_1.2,0.4866879940032959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,32,power_law_1.2,0.9132608413696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,32,power_law_1.2,2.5157440185546873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,balanced,0.09236266215642293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,balanced,0.0925439993540446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,balanced,0.09213866790135701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,32,power_law_1.2,0.024223999679088594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,balanced,0.10141866405804952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,balanced,0.0941973328590393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,32,power_law_1.2,0.02316800057888031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,balanced,0.09390933314959209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,32,power_law_1.2,0.02330880016088486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,balanced,0.10470933715502422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,32,power_law_1.2,0.025164800882339477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,balanced,0.10099732875823975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,32,power_law_1.2,0.02620159983634949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,balanced,0.09825066725413005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,balanced,0.659770647684733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,balanced,0.09763200084368388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,32,power_law_1.2,0.02685439884662628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,32,power_law_1.2,0.027244800329208375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,balanced,0.10146133104960124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,balanced,0.10506666700045268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,32,power_law_1.2,0.026943999528884887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,balanced,0.09422399600346883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,32,power_law_1.2,0.027398398518562316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,balanced,0.09449066718419392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,32,power_law_1.2,0.02768639922142029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,balanced,0.1000426709651947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,32,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,balanced,0.10876267155011494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,32,power_law_1.2,0.030124801397323608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,balanced,0.09005866448084514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,32,power_law_1.2,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,balanced,0.09038399656613667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,32,power_law_1.2,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,32,power_law_1.2,0.03666560053825378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,balanced,0.0921013355255127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,32,power_law_1.2,0.037894400954246524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,balanced,0.0839359958966573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,32,power_law_1.2,0.0438400000333786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,balanced,0.07669866581757863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,32,power_law_1.2,0.05386880040168762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,32,power_law_1.2,0.06432639956474304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,balanced,0.13301866253217062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,32,power_law_1.2,0.08960639834403991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,balanced,0.10801066954930623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,32,power_law_1.2,0.08796160221099854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,32,power_law_1.2,0.12773120403289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,32,power_law_1.2,0.1766144037246704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,balanced,0.149509330590566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,32,power_law_1.2,0.23354239463806153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,32,power_law_1.2,0.35747199058532714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,balanced,0.1812480092048645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,32,power_law_1.2,0.5608128070831299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,balanced,0.05970133344332377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,32,power_law_1.2,0.7285632133483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,balanced,0.06115733087062836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,balanced,0.06559466818968455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,32,power_law_1.2,0.8132224082946777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,balanced,0.06342933575312297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,balanced,0.25565866629282635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,32,power_law_1.2,1.3795392036437988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,balanced,0.06403199831644694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,balanced,0.06479466458161671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,32,power_law_1.2,3.806630325317383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,balanced,0.06322133541107178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,balanced,0.06492266555627187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,balanced,0.0673173318306605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,balanced,0.06379200021425883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,balanced,0.06727999945481618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,balanced,0.06717333197593689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,balanced,0.3291200002034505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,balanced,0.06508266429106395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,balanced,0.06979733208815257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,balanced,0.07043200234572093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.09286400079727172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,balanced,0.028794666131337483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,balanced,0.06921066840489705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.061952000856399535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.08926079869270324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,balanced,0.028560000161329906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.08884479999542236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,balanced,0.07295466462771098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.0630016028881073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,balanced,0.028757333755493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.09531520009040832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.06178560256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,balanced,0.07646933197975159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,balanced,0.030389333764712017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.06595199704170226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.09355520009994507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,balanced,0.030458666384220123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,balanced,0.08160533507664998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.09416959881782531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.06377599835395813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,balanced,0.4145653247833252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,balanced,0.03183466692765554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.09199360013008118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.06605439782142639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,balanced,0.0321066677570343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,balanced,0.0851200024286906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.09021440148353577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.06252800226211548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,balanced,0.03194666653871536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.09313920140266418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,balanced,0.03195200115442276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.06221439838409424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,balanced,0.12474133570988973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,balanced,0.032986665765444435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.0967296004295349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.061939197778701785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,balanced,0.03283733377854029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.09339519739151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.05865600109100342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,balanced,0.12590932846069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,balanced,0.033301333586374916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.060755199193954466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.08616960048675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,balanced,0.034074666599432625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.060550397634506224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.08250240087509156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,balanced,0.03446399917205175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.058931201696395874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.07715839743614197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,balanced,0.03791466603676478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.05679360032081604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,balanced,0.1725920041402181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,balanced,0.037503999968369804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.05479679703712463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.11927039623260498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.06899200081825256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.10936959981918334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,power_law_1.01,0.028121599555015565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.07684479951858521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.1465407967567444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,power_law_1.01,0.028140801191329955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,balanced,0.6141440073649088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,balanced,0.21316266059875488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.10184320211410522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.17339520454406737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,power_law_1.01,0.02821120023727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.10359040498733521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,power_law_1.01,0.030156800150871278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.21283199787139892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,power_law_1.01,0.030585598945617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.1503999948501587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.2748608112335205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,power_law_1.01,0.03128319978713989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,balanced,0.04062400013208389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.19211519956588746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.4036223888397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,power_law_1.01,0.03173120021820068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.24688000679016114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,power_law_1.01,0.03237760066986084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,balanced,0.04067733387152354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.5130047798156738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,power_law_1.01,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.3107583999633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.01,0.7283584117889405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,power_law_1.01,0.033292800188064575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,balanced,0.29868799448013306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.4908031940460205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.01,0.8969728469848632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.675270414352417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,power_law_1.01,0.03660799860954285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.01,1.3691712379455567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,power_law_1.01,0.036620798707008365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,1,128,power_law_1.2,0.0898688018321991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,1.141913604736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,power_law_1.01,0.04870400130748749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.01,2.0229375839233397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,1,128,power_law_1.2,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,power_law_1.01,0.051052802801132204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,1.357695960998535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,power_law_1.01,0.05429760217666626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,1,128,power_law_1.2,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.01,3.319846343994141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.01,1.9186431884765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,balanced,0.05527466535568237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,1,128,power_law_1.2,0.0914687991142273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.01,5.6014656066894535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,1,128,power_law_1.2,0.0912447988986969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.01,3.1957759857177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,balanced,0.38357333342234295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,power_law_1.01,0.06403200030326843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,1,128,power_law_1.2,0.09349759817123413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,power_law_1.01,0.08456959724426269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,1,128,power_law_1.2,0.09806720018386841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.01,0.10494719743728638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.01,7.39336929321289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.01,12.577683258056641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,1,128,power_law_1.2,0.0989184021949768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,1,128,power_law_1.2,0.08919039964675904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.01,0.11811840534210205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,1,128,power_law_1.2,0.0930624008178711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,balanced,0.06838933130105336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.01,0.15179519653320311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,1,128,power_law_1.2,0.08692479729652405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,1,128,power_law_1.2,0.08391039967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.01,0.16829440593719483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,balanced,0.07589333256085713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,1,128,power_law_1.2,0.07365120053291321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.01,0.26178560256958006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,balanced,0.46933865547180176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,1,128,power_law_1.2,0.07731840014457703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,1,128,power_law_1.2,0.12188800573348998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,1,128,power_law_1.2,0.11452800035476685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,1,128,power_law_1.2,0.11918079853057861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.01,0.3869823932647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,balanced,0.09452799956003825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,balanced,1.2002399762471516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,1,128,power_law_1.2,0.17276159524917603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,1,128,power_law_1.2,0.232588791847229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,1,128,power_law_1.2,0.32261760234832765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,1,128,power_law_1.2,0.40682239532470704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,1,128,power_law_1.2,0.6089216232299804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,1,128,power_law_1.2,0.8481920242309571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.01,0.4592576026916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,balanced,0.11214400331179301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,1,128,power_law_1.2,1.078656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.01,0.802393627166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,1,128,power_law_1.2,1.726950454711914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,balanced,0.7264853318532308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,1,128,power_law_1.2,3.1006399154663087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,1,128,power_law_1.2,4.2206462860107425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.01,0.919315242767334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,balanced,0.15734933813412985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,1,128,power_law_1.2,5.244831848144531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,1,128,power_law_1.2,8.963398742675782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,1,128,power_law_1.2,19.653273010253905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,power_law_1.01,1.1423999786376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,power_law_1.01,1.9105663299560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.05902079939842224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,balanced,0.19130132595698038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,power_law_1.01,3.7248191833496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.0606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.06115840077400207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.06170880198478699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.06077439785003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.06341760158538819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.061484801769256595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.060755199193954466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.06056960225105286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.0643392026424408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,balanced,0.23607999086380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.05945600271224975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.057625597715377806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.0543615996837616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.0622655987739563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.07912960052490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.07850239872932434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,balanced,1.411087989807129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.08794879913330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.10880000591278076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.13244800567626952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.19436800479888916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.2531647920608521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.38670079708099364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.5174719810485839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.7801023960113526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,1.0304320335388184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,1.6833280563354491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,balanced,0.35051198800404865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,2.2411520004272463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,1,128,power_law_1.2,2.8254720687866213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,1,128,power_law_1.2,5.0077056884765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,1,128,power_law_1.2,10.408000183105468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,balanced,0.03522666543722153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,balanced,0.034416000048319496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,balanced,0.034586665530999504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,balanced,0.036303999523321785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,balanced,0.04285866518815359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,balanced,0.03992533435424169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,balanced,0.044079999128977455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,balanced,0.042965332667032875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,1,128,power_law_1.2,0.0282368004322052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,balanced,0.043365334471066795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,balanced,0.702735980351766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,1,128,power_law_1.2,0.02821120023727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,balanced,0.04423999786376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,1,128,power_law_1.2,0.028492799401283263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,balanced,0.045114666223526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,balanced,0.04513066510359446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,1,128,power_law_1.2,0.030374398827552794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,balanced,0.04618666569391886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,1,128,power_law_1.2,0.03076480031013489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,balanced,0.048767998814582825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,1,128,power_law_1.2,0.0315200001001358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,balanced,0.05198400219281515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,1,128,power_law_1.2,0.033030399680137636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,balanced,0.0529120018084844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,1,128,power_law_1.2,0.032691198587417605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,balanced,0.051829333106676735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,balanced,0.036373332142829895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,1,128,power_law_1.2,0.03304319977760315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,balanced,0.05484800040721893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,balanced,0.03640533238649368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,1,128,power_law_1.2,0.033907198905944826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,balanced,0.03709333389997482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,balanced,0.05541866521040598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,1,128,power_law_1.2,0.03438720107078552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,balanced,0.03824000060558319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,1,128,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,balanced,0.06805333495140076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,1,128,power_law_1.2,0.04184960126876831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,balanced,0.038176000118255615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,1,128,power_law_1.2,0.050547200441360476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,balanced,0.06461333235104878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,1,128,power_law_1.2,0.05600000023841858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,balanced,0.039018665750821434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,balanced,0.07835199932257335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,1,128,power_law_1.2,0.06903039813041686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,balanced,0.03903999924659729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,balanced,0.039247999588648476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,balanced,0.07700799902280171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,1,128,power_law_1.2,0.07728639841079712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,balanced,0.03939199944337209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,1,128,power_law_1.2,0.11429760456085206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,balanced,0.0400693342089653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.01,0.0463808000087738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.2,0.13512320518493653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,balanced,0.04185600082079569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,balanced,0.09887466828028361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.01,0.03904640078544617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,balanced,0.04542933404445648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.01,0.038412800431251524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.2,0.18161280155181886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,balanced,0.04438933233420054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.01,0.04286080002784729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.2,0.2688127994537354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,balanced,0.04572266836961111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.01,0.042694398760795595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,balanced,0.10602666934331258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,balanced,0.05206400156021118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.01,0.04162560105323791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.01,0.04166400134563446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.2,0.2881664037704468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,balanced,0.026949333647886913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,balanced,0.05746666590372721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.01,0.04385280013084412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.2,0.39829120635986326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,balanced,0.026880001028378803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,balanced,0.07210666437943776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.01,0.04627839922904968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,balanced,0.026848000784715016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.01,0.046367999911308286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,balanced,0.028981332977612812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,balanced,0.15381866693496704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,balanced,0.07502399881680806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.01,0.0507968008518219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.2,0.5490880012512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,balanced,0.029813334345817566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,balanced,0.03145600110292435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.01,0.05225600004196167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,balanced,0.09500267108281453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,balanced,0.03213333338499069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.01,0.05370240211486817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.2,0.6999360084533691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,balanced,0.03149333347876867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.01,0.05360640287399292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,balanced,0.03164800008138021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.2,1.2014016151428222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.01,0.05845119953155518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,balanced,0.10576533277829488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.01,0.035359999537467955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.01,0.0597760021686554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,balanced,0.0329066663980484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,balanced,0.17258665959040323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.01,0.034790399670600894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.2,1.4177280426025392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.01,0.067603200674057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,balanced,0.03331200033426285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.01,0.03484799861907959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,balanced,0.13838932911554971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,balanced,0.03384533276160558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.01,0.07955200076103211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.01,0.034892800450325015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,balanced,0.03425066669782003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.01,0.09242240190505982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.01,0.03578880131244659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,1,128,power_law_1.2,1.839148712158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.01,0.036652800440788266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,balanced,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.01,0.11890560388565063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.01,0.03648000061511993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,1,128,power_law_1.2,2.7166656494140624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,balanced,0.03682133307059606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.01,0.11826560497283936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.01,0.03697279989719391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,balanced,0.16426133116086325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.01,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.01,0.15846400260925292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,1,128,power_law_1.2,5.394572830200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.01,0.03819519877433777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.01,0.19123200178146363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.01,0.03997440040111542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.01,0.2984767913818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.01,0.04271360039710999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,balanced,0.19673067331314087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.01,0.04302079975605011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.01,0.3252032041549683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,balanced,0.03766933331886927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.01,0.04748800098896026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.01,0.4145088195800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.01,0.05144320130348205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,balanced,0.23589332898457846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.01,0.056377601623535153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.01,0.4830336093902588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,balanced,0.042768001556396484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.01,0.06158080101013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.01,0.6499968051910401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.01,0.07750399708747864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.01,0.08213120102882385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.01,1.0877696037292481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.01,0.09784960150718688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.01,0.1128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.01,2.3856576919555663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,power_law_1.01,0.02824319899082184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,balanced,0.054666668176651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.01,0.14652160406112671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,power_law_1.01,0.027027198672294618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,balanced,0.2865920066833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.01,0.16673920154571534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,balanced,0.06006399790445963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,power_law_1.01,0.02686080038547516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.01,0.25401599407196046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,power_law_1.01,0.02963840067386627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.01,0.29663360118865967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,power_law_1.01,0.0302592009305954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,balanced,0.2998239994049072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.01,0.40590720176696776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,power_law_1.01,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,balanced,0.07369066774845123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.01,0.5878143787384034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,power_law_1.01,0.03208959996700287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.01,0.7256703853607178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,power_law_1.01,0.03203200101852417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,power_law_1.01,0.03245440125465393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,balanced,0.08372799555460612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.01,1.3130240440368652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,power_law_1.01,0.0338239997625351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,balanced,0.3439466555913289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.01,2.167692756652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,power_law_1.01,0.03649280071258545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,power_law_1.01,0.03687680065631867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,power_law_1.01,0.042630401253700254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,power_law_1.01,0.04907520115375519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,power_law_1.01,0.057792001962661745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,balanced,0.10654399792353313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,power_law_1.01,0.06166399717330932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,64,power_law_1.2,0.04586879909038544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,power_law_1.01,0.07487360239028931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,64,power_law_1.2,0.03685120046138764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,64,power_law_1.2,0.03863680064678192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,power_law_1.01,0.09349120259284974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,64,power_law_1.2,0.04173440039157868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,64,power_law_1.2,0.042259201407432556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,power_law_1.01,0.11013760566711425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,balanced,0.12826666235923767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,64,power_law_1.2,0.040863999724388124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,balanced,0.5300000111262003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,64,power_law_1.2,0.04389120042324066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,power_law_1.01,0.13863680362701417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,64,power_law_1.2,0.04482559859752655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,power_law_1.01,0.17200000286102296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,64,power_law_1.2,0.04620159864425659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,64,power_law_1.2,0.04984320104122162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,power_law_1.01,0.200927996635437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,64,power_law_1.2,0.0515392005443573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,balanced,0.18198400735855103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,64,power_law_1.2,0.053497600555419925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,balanced,0.531829317410787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,power_law_1.01,0.3384255886077881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,64,power_law_1.2,0.05425919890403748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,64,power_law_1.2,0.05427839756011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,power_law_1.01,0.4758272171020508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,64,power_law_1.2,0.061945599317550656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,power_law_1.01,0.812934398651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,64,power_law_1.2,0.06711680293083191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,64,power_law_1.2,0.07674239873886109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,power_law_1.01,0.8425087928771973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,64,power_law_1.2,0.09668480157852173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,balanced,0.2257759968439738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,64,power_law_1.2,0.10432640314102173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,64,power_law_1.2,0.16183680295944214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,64,power_law_1.2,0.1557055950164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,power_law_1.01,1.116639995574951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,64,power_law_1.2,0.23045120239257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,64,power_law_1.2,0.25372159481048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,power_law_1.01,1.5975232124328613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,64,power_law_1.2,0.4453375816345215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,64,power_law_1.2,0.5471168041229248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,power_law_1.01,3.228179168701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,64,power_law_1.2,0.6594048023223877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,64,power_law_1.2,1.0552255630493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,64,power_law_1.2,1.2176383972167968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,balanced,0.2829493284225464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,64,power_law_1.2,2.5832576751708984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,64,power_law_1.2,4.9296001434326175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,balanced,1.0101546446482341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,balanced,0.4504053195317586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,64,power_law_1.2,0.03909119963645935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,64,power_law_1.2,0.03865599930286408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,64,power_law_1.2,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,64,power_law_1.2,0.03861759901046753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,64,power_law_1.2,0.03735679984092712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,64,power_law_1.2,0.03730559945106506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,64,power_law_1.2,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,64,power_law_1.2,0.03813120126724243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,64,power_law_1.2,0.038431999087333676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,64,power_law_1.2,0.040031999349594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,64,power_law_1.2,0.04286719858646393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,64,power_law_1.2,0.04440320134162903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,64,power_law_1.2,0.048172798752784726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,64,power_law_1.2,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,64,power_law_1.2,0.055129599571228025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,64,power_law_1.2,0.05842559933662415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,64,power_law_1.2,0.06321280002593994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,64,power_law_1.2,0.08227199912071229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,64,power_law_1.2,0.028255999088287354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,64,power_law_1.2,0.09278079867362976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,64,power_law_1.2,0.026995199918746948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,64,power_law_1.2,0.12521599531173705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,64,power_law_1.2,0.027897599339485168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,64,power_law_1.2,0.12544000148773193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,64,power_law_1.2,0.029791998863220214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,balanced,0.03403733422358831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,64,power_law_1.2,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,64,power_law_1.2,0.1890496015548706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,balanced,0.872053305308024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,64,power_law_1.2,0.03150720000267029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,64,power_law_1.2,0.03192319869995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,64,power_law_1.2,0.2050175905227661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,balanced,0.03302400062481562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,64,power_law_1.2,0.03208320140838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,64,power_law_1.2,0.32427520751953126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,64,power_law_1.2,0.03218559920787811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,balanced,0.030495998760064442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,64,power_law_1.2,0.03327359855175018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,64,power_law_1.2,0.40634880065917967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,64,power_law_1.2,0.03568640053272247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,balanced,0.03201599915822347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,64,power_law_1.2,0.03766399919986725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,64,power_law_1.2,0.6126912117004395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,64,power_law_1.2,0.04030719995498657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,balanced,0.03956799954175949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,64,power_law_1.2,0.8991423606872558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,64,power_law_1.2,0.04659200012683869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,64,power_law_1.2,0.05604479908943176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,balanced,0.041333332657814026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,64,power_law_1.2,1.0340800285339355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,64,power_law_1.2,0.058847999572753905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,balanced,0.042863999803860985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,64,power_law_1.2,2.2005504608154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,balanced,0.044405331214269005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,64,power_law_1.2,0.06807680130004883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,64,power_law_1.2,0.09359359741210938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,balanced,0.04190400242805481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,64,power_law_1.2,4.182182312011719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,64,power_law_1.2,0.11574399471282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,balanced,0.04322133461634318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,balanced,0.04520000020662943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,balanced,0.0470719983180364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,64,power_law_1.2,0.13953280448913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,64,power_law_1.2,0.17541760206222534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,balanced,0.048309331138928734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,balanced,0.04673066735267639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,64,power_law_1.2,0.2610752105712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,balanced,0.05077333251635233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,64,power_law_1.2,0.35009920597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,balanced,0.05242133140563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,balanced,0.03323733309904734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,balanced,0.053210665782292686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,64,power_law_1.2,0.562611198425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,balanced,0.03204799940188726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,balanced,0.055530667304992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,balanced,0.03221333275238673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,64,power_law_1.2,0.7648896217346192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,balanced,0.05746666590372721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,balanced,0.0367253323396047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,64,power_law_1.2,1.1050304412841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,balanced,0.03892799963553747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,balanced,0.07006399830182393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,balanced,0.03749333322048187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,64,power_law_1.2,1.4478336334228517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,balanced,0.0672106643517812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,balanced,0.037861332297325134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,balanced,0.03782933453718821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,balanced,0.037818667789300285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,64,power_law_1.2,2.0534143447875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,balanced,0.08341333270072937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,balanced,0.03862933317820231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,balanced,0.038773333032925926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,64,power_law_1.2,2.8815168380737304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,balanced,0.038917332887649536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,balanced,0.08384533723195393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,balanced,0.03988266736268997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,balanced,0.041306667029857635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,64,power_law_1.2,7.222541046142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,balanced,0.04378666480382284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,balanced,0.0436106671889623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,balanced,0.10972799857457478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,balanced,0.045253331462542214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,balanced,0.051685333251953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,balanced,0.057909334699312844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,balanced,0.12187199791272481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,balanced,0.07346666852633159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.01,0.03957119882106781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,balanced,0.07876800000667572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.01,0.04353919923305512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.01,0.037427198886871335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.01,0.03566080033779144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.01,0.03338879942893982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,balanced,0.09848533074061076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.01,0.03429119884967804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.01,0.03516800105571747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,balanced,0.17836799224217734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.01,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.01,0.037190398573875426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,balanced,0.11076800028483073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.01,0.03731839954853058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.01,0.042745599150657655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,balanced,0.027066667874654133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.01,0.03678080141544342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.01,0.044268798828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.01,0.03687680065631867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,balanced,0.14867732922236124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.01,0.046214398741722104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.01,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,balanced,0.027029333015282948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.01,0.03888640105724335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.01,0.05063679814338684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,balanced,0.029616000751654308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.01,0.03954559862613678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.01,0.05113599896430969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,balanced,0.20480533440907797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,balanced,0.03035199890534083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.01,0.041196799278259276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,balanced,0.17913599809010824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.01,0.05363839864730835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,balanced,0.03169066707293192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.01,0.04242559969425201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.01,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.01,0.043987199664115906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.01,0.056620800495147706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,balanced,0.031658666829268135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.01,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.01,0.051910400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,balanced,0.032042667269706726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.01,0.05413119792938233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,balanced,0.25493866205215454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,balanced,0.032458665470282234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.01,0.05806080102920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.01,0.05491840243339539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,balanced,0.03306133300065994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.01,0.06383360028266907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.01,0.06810240149497986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,balanced,0.23679999510447183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.01,0.07635200023651123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.01,0.07790079712867737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,balanced,0.03442666679620743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.01,0.08844799995422363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.01,0.0989247977733612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,balanced,0.03495999922355016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.01,0.09952639937400817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.01,0.10921599864959716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.01,0.11434240341186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.01,0.13910399675369262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,balanced,0.317903995513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,balanced,0.04078399886687597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.01,0.14436479806900024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.01,0.16122879981994628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,balanced,0.039434666434923805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.01,0.1615231990814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.01,0.23840639591217042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.01,0.24496641159057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.01,0.2872447967529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.01,0.27701759338378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.01,0.4294911861419678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.01,0.34505600929260255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.01,0.5491199970245362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,balanced,0.040261333187421165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.01,0.5363455772399902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.01,0.6470719814300537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,balanced,0.0466186652580897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.01,0.6299327850341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.01,1.0712703704833983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,balanced,0.3834293286005656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,balanced,0.3659573396046956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,balanced,0.04797333478927612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.01,0.9470527648925782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.01,2.483168029785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.01,2.071468734741211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,power_law_1.01,0.029631999135017396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,balanced,0.06205866734186808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,power_law_1.01,0.027475199103355406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,balanced,0.0684799998998642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,power_law_1.01,0.02710399925708771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,power_law_1.01,0.029580798745155335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,power_law_1.01,0.030847999453544616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,power_law_1.01,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,balanced,0.08658666412035625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,power_law_1.01,0.032307198643684386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,power_law_1.01,0.03342080116271973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,balanced,0.5932000080744425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,power_law_1.01,0.03368319869041443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,balanced,0.09985599915186565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,power_law_1.01,0.03488639891147614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,power_law_1.01,0.03688960075378418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,32,power_law_1.2,0.039647999405860904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,power_law_1.01,0.03925760090351105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,32,power_law_1.2,0.03372159898281098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,power_law_1.01,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,32,power_law_1.2,0.031001600623130798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,power_law_1.01,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,32,power_law_1.2,0.035795199871063235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,balanced,0.13272533814112344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,32,power_law_1.2,0.03827199935913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,power_law_1.01,0.04762240052223206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,32,power_law_1.2,0.04238080084323883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,power_law_1.01,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,32,power_law_1.2,0.04348799884319306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,32,power_law_1.2,0.04731520116329193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,32,power_law_1.2,0.05134720206260681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,32,power_law_1.2,0.0514303982257843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,power_law_1.01,0.06437119841575623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,32,power_law_1.2,0.05368959903717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,power_law_1.01,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,32,power_law_1.2,0.05565440058708191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,balanced,0.6538986762364706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,power_law_1.01,0.08602880239486695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,32,power_law_1.2,0.058457601070404056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,balanced,0.1649333337942759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,32,power_law_1.2,0.05267840027809143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,power_law_1.01,0.10556800365447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,32,power_law_1.2,0.059545600414276124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,32,power_law_1.2,0.04351359903812409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,power_law_1.01,0.1319551944732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,32,power_law_1.2,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,32,power_law_1.2,0.06680319905281067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,32,power_law_1.2,0.037171199917793274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,32,power_law_1.2,0.08459519743919372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,power_law_1.01,0.16563839912414552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,32,power_law_1.2,0.0342848002910614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,32,power_law_1.2,0.09550079703330994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,balanced,0.25255467494328815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,power_law_1.01,0.23816320896148682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,32,power_law_1.2,0.11454720497131347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,32,power_law_1.2,0.038022398948669434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,32,power_law_1.2,0.11501439809799194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,32,power_law_1.2,0.03744640052318573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,32,power_law_1.2,0.16661759614944457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,power_law_1.01,0.3362623929977417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,32,power_law_1.2,0.037036800384521486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,32,power_law_1.2,0.22542719841003417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,32,power_law_1.2,0.28012158870697024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,32,power_law_1.2,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,balanced,1.1340746879577637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,power_law_1.01,0.39057919979095457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,32,power_law_1.2,0.3865920066833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,32,power_law_1.2,0.039110401272773744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,power_law_1.01,0.6504511833190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,32,power_law_1.2,0.5458240032196044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,32,power_law_1.2,0.03882879912853241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,32,power_law_1.2,0.7730944156646729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,power_law_1.01,0.8663807868957519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,balanced,0.32440000772476196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,32,power_law_1.2,0.03978880047798157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,32,power_law_1.2,1.0776703834533692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,power_law_1.01,0.8824319839477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,32,power_law_1.2,0.04173440039157868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,32,power_law_1.2,2.027680015563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,power_law_1.01,1.7294656753540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,32,power_law_1.2,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,32,power_law_1.2,0.04584319889545441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,32,power_law_1.2,3.737401580810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,power_law_1.01,3.8557056427001952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,32,power_law_1.2,0.04573439955711365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,32,power_law_1.2,0.05101439952850342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,32,power_law_1.2,0.055180799961090085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,32,power_law_1.2,0.06104320287704468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,balanced,0.3954186836878459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,32,power_law_1.2,0.07574399709701538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,32,power_law_1.2,0.08680959939956664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,32,power_law_1.2,0.11678080558776856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,32,power_law_1.2,0.1377344012260437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,32,power_law_1.2,0.15302400588989257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,32,power_law_1.2,0.20151679515838622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,32,power_law_1.2,0.2986047983169556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,32,power_law_1.2,0.3620160102844238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,32,power_law_1.2,0.6502272129058838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,32,power_law_1.2,0.8255807876586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,32,power_law_1.2,0.9023103713989258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,balanced,0.6089119911193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,32,power_law_1.2,2.2572608947753907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,32,power_law_1.2,4.238905715942383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,balanced,0.033301333586374916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,balanced,0.02914133419593175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,balanced,0.029317334294319153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,32,power_law_1.2,0.029824000597000123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,balanced,0.03204799940188726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,balanced,0.03879466652870178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,32,power_law_1.2,0.027270400524139406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,balanced,0.03969600051641464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,32,power_law_1.2,0.028230398893356323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,balanced,0.04264533519744873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,32,power_law_1.2,0.029580798745155335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,balanced,0.04269866645336151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,32,power_law_1.2,0.030662399530410767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,balanced,0.042394667863845825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,32,power_law_1.2,0.03155840039253235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,balanced,0.042453333735466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,balanced,0.04355733096599579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,32,power_law_1.2,0.03239679932594299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,balanced,0.04442666471004486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,32,power_law_1.2,0.034431999921798705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,balanced,0.045968001087506614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,32,power_law_1.2,0.035436800122261046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,balanced,1.1868693033854167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,balanced,0.05410666763782501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,32,power_law_1.2,0.03594880104064942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,32,power_law_1.2,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,balanced,0.0513973335425059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,32,power_law_1.2,0.040601599216461184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,balanced,0.05282666782538096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,32,power_law_1.2,0.040243199467658995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,balanced,0.05400000015894572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,32,power_law_1.2,0.04800640046596527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,balanced,0.05929600199063619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,balanced,0.05916266640027364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,32,power_law_1.2,0.0532800018787384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,32,power_law_1.2,0.053401601314544675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,balanced,0.07393600046634674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,balanced,0.07422400017579396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,32,power_law_1.2,0.06256639957427979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,32,power_law_1.2,0.07982079982757569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,balanced,0.09366400043169658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,32,power_law_1.2,0.09573760032653808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,32,power_law_1.2,0.13716479539871215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,balanced,0.09587732950846355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,balanced,0.03307733436425527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,32,power_law_1.2,0.16501760482788086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,balanced,0.032885332902272545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,32,power_law_1.2,0.23644800186157228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,balanced,0.03309333324432373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,balanced,0.1337279975414276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,balanced,0.03616533428430557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,32,power_law_1.2,0.30392320156097413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,balanced,0.038165333370367684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,balanced,0.03903999924659729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,balanced,0.03946666667858759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,32,power_law_1.2,0.48428797721862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,balanced,0.03945599993069967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,balanced,0.15556800365447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,balanced,0.03959999978542328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,balanced,0.04029866556326548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,32,power_law_1.2,0.6338111877441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,balanced,0.040762667854626976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,balanced,0.040735999743143715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,32,power_law_1.2,1.185574436187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,balanced,0.0418453315893809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,32,power_law_1.2,1.3124480247497559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,balanced,0.04615999758243561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,balanced,0.046906664967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,32,power_law_1.2,1.5109888076782227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,balanced,0.22769065697987875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,balanced,0.04660266637802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,32,power_law_1.2,3.172979164123535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.01,0.04699519872665405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,balanced,0.04897599915663401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,balanced,0.02759466568628947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.01,0.031455999612808226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,balanced,0.05709866682688395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,32,power_law_1.2,7.15331802368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.01,0.03223679959774017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.01,0.04195199906826019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,balanced,0.0271519993742307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,balanced,0.06276800235112508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.01,0.04036479890346527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,balanced,0.028042666614055634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.01,0.035718399286270144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.01,0.039603200554847715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,balanced,0.07886399825414021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,balanced,0.030458666384220123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.01,0.041119998693466185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.01,0.032979199290275575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,balanced,0.03223466624816259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.01,0.040863999724388124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,balanced,0.276037335395813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,balanced,0.08705066641171773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.01,0.03485440015792847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,balanced,0.03364266703526179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.01,0.04348160028457641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.01,0.037503999471664426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,balanced,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.01,0.045510399341583255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.01,0.039980798959732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.01,0.04615679979324341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,balanced,0.11043733358383179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,balanced,0.033701332906881966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.01,0.05072000026702881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.01,0.039443200826644896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,balanced,0.034527999659379326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.01,0.05232639908790589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.01,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,balanced,0.035360001027584076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.01,0.05319039821624756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,balanced,0.12446399529774983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.01,0.05299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,balanced,0.035487999518712364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,balanced,0.0367253323396047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.01,0.04209280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.01,0.0565887987613678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.01,0.0610368013381958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,balanced,0.037733333806196846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.01,0.04334079921245575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,balanced,0.1725013256072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.01,0.06096000075340271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,balanced,0.3246293266614278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.01,0.045721599459648134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,balanced,0.038005332152048744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.01,0.07679359912872315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.01,0.07898240089416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.01,0.04755200147628784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.01,0.10250240564346313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,balanced,0.044533332188924156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.01,0.1044160008430481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.01,0.04625279903411865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,balanced,0.21362666289011636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,balanced,0.043653334180514015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.01,0.14627840518951415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.01,0.05230720043182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.01,0.16519039869308472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.01,0.05441920161247253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.01,0.217523193359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.01,0.05968639850616455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.01,0.27761919498443605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.01,0.06985599994659424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.01,0.3935679912567139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,balanced,0.047210668524106346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.01,0.5080959796905518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.01,0.08210560083389282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,power_law_1.01,0.033843201398849485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,balanced,0.055829331278800964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,balanced,0.3112480044364929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.01,0.1024448037147522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.01,0.5392320156097412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,power_law_1.01,0.028288000822067262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.01,0.11345280408859253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.01,1.0417407989501952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,balanced,0.05942399799823761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,power_law_1.01,0.028806400299072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.01,0.1438591957092285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.01,2.208415985107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,power_law_1.01,0.03022719919681549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.01,0.17767679691314697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,balanced,0.480954647064209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,power_law_1.01,0.03152639865875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.01,0.24961280822753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,balanced,0.07683733105659485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,power_law_1.01,0.03391999900341034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.01,0.32697598934173583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,balanced,0.08458133538564046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.01,0.4751488208770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,balanced,0.3979146480560303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,power_law_1.01,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.01,0.6431935787200928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,power_law_1.01,0.03722879886627197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.01,0.7868607997894287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,power_law_1.01,0.037484800815582274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.01,1.1511296272277831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,power_law_1.01,0.0392192006111145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,balanced,0.113045334815979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,power_law_1.01,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.01,2.749113655090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,power_law_1.01,0.045151999592781066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,balanced,0.13455466429392496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,power_law_1.01,0.049344000220298764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,power_law_1.01,0.05427839756011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,balanced,0.4814079999923706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,power_law_1.01,0.057068800926208495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,16,power_law_1.2,0.04555520117282867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,balanced,0.20039467016855875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,16,power_law_1.2,0.031200000643730165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,power_law_1.01,0.06420480012893677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,16,power_law_1.2,0.03170560002326965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,power_law_1.01,0.08133760094642639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,16,power_law_1.2,0.03937279880046844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,power_law_1.01,0.09427840113639832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,16,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,16,power_law_1.2,0.04012799859046936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,power_law_1.01,0.11726720333099365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,16,power_law_1.2,0.04047360122203827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,power_law_1.01,0.13639039993286134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,16,power_law_1.2,0.042335999011993405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,balanced,0.2625173330307007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,16,power_law_1.2,0.04469760060310364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,16,power_law_1.2,0.05400959849357605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,power_law_1.01,0.23677439689636232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,16,power_law_1.2,0.05167359709739685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,power_law_1.01,0.29130239486694337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,16,power_law_1.2,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,balanced,0.9360319773356119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,balanced,0.7272373040517172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,16,power_law_1.2,0.053376001119613645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,power_law_1.01,0.3801151990890503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,16,power_law_1.2,0.05545600056648255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,balanced,0.38236268361409503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,16,power_law_1.2,0.05812479853630066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,power_law_1.01,0.5125184059143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,16,power_law_1.2,0.06112639904022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,power_law_1.01,0.7998655796051025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,16,power_law_1.2,0.06636160016059875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,power_law_1.01,1.0457728385925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,16,power_law_1.2,0.08435199856758117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,16,power_law_1.2,0.08154240250587463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,power_law_1.01,1.2219584465026856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,16,power_law_1.2,0.11438080072402954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,balanced,0.4902026653289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,16,power_law_1.2,0.10803200006484985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,power_law_1.01,2.0155008316040037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,16,power_law_1.2,0.15459840297698973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,power_law_1.01,4.521542358398437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,16,power_law_1.2,0.21362559795379638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,16,power_law_1.2,0.296012806892395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,16,power_law_1.2,0.3720704078674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,16,power_law_1.2,0.5148287773132324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,16,power_law_1.2,0.7641471862792969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,16,power_law_1.2,0.8928256034851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,balanced,0.6012320121129354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,16,power_law_1.2,0.04019840061664581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,16,power_law_1.2,1.7147712707519531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,16,power_law_1.2,0.03309440016746521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,16,power_law_1.2,0.032627201080322264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,16,power_law_1.2,3.636377716064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,16,power_law_1.2,0.03505280017852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,16,power_law_1.2,0.03695360124111176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,16,power_law_1.2,0.03996799886226654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,balanced,1.4176319440205891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,16,power_law_1.2,0.03952000141143799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,16,power_law_1.2,0.040454399585723874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,16,power_law_1.2,0.04092159867286682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,16,power_law_1.2,0.04199680089950562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,16,power_law_1.2,0.04506239891052246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,16,power_law_1.2,0.04798719882965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,balanced,0.9362613360087076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,16,power_law_1.2,0.04873600006103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,16,power_law_1.2,0.04614399969577789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,16,power_law_1.2,0.051097601652145386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,16,power_law_1.2,0.05559679865837097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,16,power_law_1.2,0.060710400342941284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,16,power_law_1.2,0.07596799731254578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,16,power_law_1.2,0.09088000059127807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,16,power_law_1.2,0.10432640314102173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,16,power_law_1.2,0.13274240493774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,16,power_law_1.2,0.16990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,16,power_law_1.2,0.18906240463256835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,16,power_law_1.2,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,16,power_law_1.2,0.3923072099685669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,16,power_law_1.2,0.578272008895874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,16,power_law_1.2,0.8308544158935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,16,power_law_1.2,1.0899200439453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,16,power_law_1.2,0.033529600501060484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,16,power_law_1.2,2.1045759201049803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,16,power_law_1.2,0.028224000334739686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,16,power_law_1.2,3.5070270538330077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,16,power_law_1.2,0.028627198934555054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,16,power_law_1.2,0.0310591995716095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,16,power_law_1.2,0.03226880133152008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,balanced,0.0354666660229365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,16,power_law_1.2,0.03400959968566895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,16,power_law_1.2,0.03505280017852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,balanced,0.03367999941110611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,16,power_law_1.2,0.03651840090751648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,balanced,0.035216001172860466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,16,power_law_1.2,0.03735679984092712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,balanced,0.04422933359940847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,16,power_law_1.2,0.03850879967212677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,balanced,1.8401172955830891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,16,power_law_1.2,0.03988479971885681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,balanced,0.04538666705290476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,16,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,balanced,0.0459146648645401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,16,power_law_1.2,0.046463999152183535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,balanced,0.04670399924119314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,16,power_law_1.2,0.04990079998970032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,balanced,0.04636266827583313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,balanced,0.04783466458320618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,16,power_law_1.2,0.055353599786758426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,balanced,0.04842133323351542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,16,power_law_1.2,0.0621504008769989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,balanced,0.050186668833096824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,balanced,0.050997331738471985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,16,power_law_1.2,0.06940159797668458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,balanced,0.05406400064627329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,16,power_law_1.2,0.08307200074195861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,balanced,0.05677866439024607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,16,power_law_1.2,0.09840000271797181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,balanced,0.03266133368015289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,balanced,0.057722667853037514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,balanced,0.03253333270549774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,balanced,0.06107200185457865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,16,power_law_1.2,0.1263360023498535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,balanced,0.03366400053103765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,balanced,0.06814933319886525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,16,power_law_1.2,0.17104640007019042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,balanced,0.03789866715669632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,balanced,0.07051200171311696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,16,power_law_1.2,0.2600575923919678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,balanced,0.04304533203442892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,balanced,0.08025066554546356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,16,power_law_1.2,0.3387455940246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,balanced,0.04334400097529093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,balanced,0.04354666670163473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,balanced,0.04348800083001455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,16,power_law_1.2,0.4555071830749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,balanced,0.08706133564313252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,balanced,0.04387733340263367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,balanced,0.04457066456476847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,16,power_law_1.2,0.7157695770263672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,balanced,0.11230400204658508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,balanced,0.04483200112978617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,balanced,0.04570133487383524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,16,power_law_1.2,1.0841407775878906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,balanced,0.047237331668535866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,16,power_law_1.2,1.346726417541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,balanced,0.13078932960828146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,balanced,0.05146666864554087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,16,power_law_1.2,2.1106815338134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,balanced,0.0516533354918162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,16,power_law_1.2,3.714131164550781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,balanced,0.05595199763774872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,balanced,0.19091200828552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,balanced,0.06703466673692067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,16,power_law_1.2,6.574259185791016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,balanced,0.07246399919191997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,balanced,0.08749866485595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,balanced,0.23882667223612467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,balanced,0.09682666261990865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,balanced,0.13150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,balanced,0.3463093439737956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,balanced,0.15457600355148315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,balanced,0.22426666816075644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.01,0.03790079951286316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.01,0.0359360009431839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.01,0.03369599878787995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,balanced,0.45453866322835285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.01,0.0406143993139267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.01,0.03529599905014038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,balanced,0.28917866945266724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.01,0.04108799993991852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.01,0.03727999925613403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.01,0.04471679925918579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.01,0.03856639862060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.01,0.044787201285362246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.01,0.04188160002231598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.01,0.04586879909038544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.01,0.04268159866333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.01,0.04573439955711365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.01,0.04333440065383911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,balanced,0.4243893225987752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.01,0.04867199957370758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.01,0.04318720102310181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.01,0.04963200092315674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,balanced,0.5431626637776693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.01,0.044684800505638125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.01,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.01,0.046777600049972536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.01,0.04874880015850067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.01,0.053855997323989865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.01,0.05063679814338684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.01,0.057868802547454835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.01,0.05208960175514221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.01,0.06421120166778564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.01,0.05729920268058777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.01,0.06472960114479065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.01,0.06231679916381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,balanced,0.5225173234939575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.01,0.06566399931907654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.01,0.07916160225868225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.01,0.07749760150909424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.01,0.08662400245666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.01,0.09007999897003174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.01,0.09944319725036621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.01,0.11496319770812988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.01,0.11805440187454223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.01,0.1244928002357483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.01,0.15281280279159545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.01,0.19764480590820313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.01,0.16958719491958618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.01,0.26092801094055174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,balanced,0.7667786280314127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.01,0.20040318965911866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.01,0.3782464027404785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.01,0.29871358871459963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.01,0.5088128089904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,balanced,0.6554346481959025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.01,0.37988479137420655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.01,0.6310912132263183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.01,0.5459968090057373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.01,0.8749312400817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.01,0.66943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.01,1.322374439239502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.01,0.9513664245605469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.01,2.849715232849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.01,1.5008959770202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.01,3.2478145599365233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,8,power_law_1.2,0.039980798959732056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,balanced,1.0069173177083333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,8,power_law_1.2,0.034835198521614076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,8,power_law_1.2,0.03678080141544342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,8,power_law_1.2,0.04191359877586365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,8,power_law_1.2,0.04108799993991852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,8,power_law_1.2,0.048102399706840514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,8,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,8,power_law_1.2,0.04871039986610413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,8,power_law_1.2,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,8,power_law_1.2,0.0517632007598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,8,power_law_1.2,0.05445759892463684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,balanced,1.491418679555257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,8,power_law_1.2,0.055961602926254274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,8,power_law_1.2,0.056518399715423585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,8,power_law_1.2,0.06156799793243408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,8,power_law_1.2,0.0650816023349762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,8,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,8,power_law_1.2,0.07467520236968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,8,power_law_1.2,0.08168320059776306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,8,power_law_1.2,0.08831999897956848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,8,power_law_1.2,0.1044927954673767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,8,power_law_1.2,0.144486403465271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,8,power_law_1.2,0.16059520244598388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,8,power_law_1.2,0.03624320030212402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,8,power_law_1.2,0.20666239261627198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,8,power_law_1.2,0.03320319950580597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,8,power_law_1.2,0.37147519588470457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,8,power_law_1.2,0.03463039994239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,8,power_law_1.2,0.43337597846984866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,8,power_law_1.2,0.03697920143604279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,8,power_law_1.2,0.037913599610328676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,8,power_law_1.2,0.6513408184051513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,8,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,8,power_law_1.2,0.8987775802612304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,8,power_law_1.2,0.041894400119781496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,8,power_law_1.2,1.2216256141662598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,8,power_law_1.2,0.04257279932498932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,8,power_law_1.2,0.04410240054130554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,8,power_law_1.2,1.8305088043212892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,balanced,1.9878452618916829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,8,power_law_1.2,0.046028798818588255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,8,power_law_1.2,0.046777600049972536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,8,power_law_1.2,4.556985473632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,8,power_law_1.2,0.0500927984714508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,8,power_law_1.2,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,8,power_law_1.2,0.0536191999912262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,8,power_law_1.2,0.05851519703865051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,8,power_law_1.2,0.06320639848709106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,8,power_law_1.2,0.06807039976119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,8,power_law_1.2,0.07836800217628478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,8,power_law_1.2,0.09334400296211243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,8,power_law_1.2,0.12423039674758911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,8,power_law_1.2,0.13500159978866577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,8,power_law_1.2,0.17879040241241456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,8,power_law_1.2,0.21354238986968993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,8,power_law_1.2,0.2965440034866333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,8,power_law_1.2,0.44072961807250977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,8,power_law_1.2,0.7415040016174317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,8,power_law_1.2,0.9555775642395019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,8,power_law_1.2,1.1828864097595215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,8,power_law_1.2,1.8804031372070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,8,power_law_1.2,4.294784164428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,balanced,0.03541333228349686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,balanced,0.03561066587766012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,balanced,0.03712533414363861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,balanced,0.0418453315893809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,balanced,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,balanced,0.05676266551017761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,balanced,0.05914666752020518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,balanced,0.0606879989306132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,balanced,0.03306133300065994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,balanced,0.06235733131567637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,balanced,0.06274666885534923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,balanced,0.03323733309904734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,balanced,0.05669866502285004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,balanced,0.03482133398453394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,balanced,0.059194669127464294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,balanced,0.04428266485532125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,balanced,0.06036800146102905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,balanced,0.050474668542544045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,balanced,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,balanced,0.06330666442712148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,balanced,0.05179200073083242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,balanced,0.06969066460927327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,balanced,0.051514665285746254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,balanced,0.07121600210666656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,balanced,0.05198400219281515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,balanced,0.07823466757933299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,balanced,0.05293866495291392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,balanced,0.052890668312708534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,balanced,0.08738666772842407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,balanced,0.05462933580080668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,balanced,0.09552533427874248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,balanced,0.055946667989095054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,balanced,0.05760533114274343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,balanced,0.11319466431935628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,balanced,0.0636053333679835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,balanced,0.12827199697494507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,balanced,0.06512000163396199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,balanced,0.06993066767851512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.01,0.03703039884567261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,balanced,0.17935999234517416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,balanced,0.08201600114504497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.01,0.03650560081005096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,balanced,0.08959466218948364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.01,0.035667198896408084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,balanced,0.19802133242289224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.01,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,balanced,0.10648533701896667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.01,0.054176002740859985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.01,0.056627202033996585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,balanced,0.12447466452916463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.01,0.05842559933662415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,balanced,0.30314133564631146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.01,0.05982720255851746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.01,0.060710400342941284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,balanced,0.1725013256072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.01,0.06174719929695129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.01,0.05811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.01,0.061638402938842776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,balanced,0.4224533240000407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,balanced,0.2160266637802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.01,0.06392959952354431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.01,0.06698240041732788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.01,0.07412480115890503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.01,0.07704960107803345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,balanced,0.3237706621487935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.01,0.08460800051689148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.01,0.09650560021400452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.01,0.11139199733734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,balanced,0.6237173477808634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.01,0.0348800003528595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.01,0.13245439529418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.01,0.033817601203918454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.01,0.15962239503860473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.01,0.03468799889087677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.01,0.19548159837722778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,balanced,0.4404640197753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.01,0.04142720103263855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.01,0.2435904026031494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.01,0.04457600116729736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.01,0.33692159652709963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.01,0.048582398891448976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.01,0.5099904060363769
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.01,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.01,0.731987190246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.01,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.01,0.980345630645752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.01,0.051622402667999265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,balanced,0.7411306699117025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.01,1.1341119766235352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.01,0.05278720259666443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,balanced,0.6519413391749064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.01,0.0562175989151001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.01,1.9507648468017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.01,0.059571200609207155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.01,0.06256639957427979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.01,3.6423553466796874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.01,0.07349759936332703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.01,0.0781503975391388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.01,0.08010879755020142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.01,0.10152319669723511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,balanced,0.7964533170064291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.01,0.10522240400314331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,balanced,0.9388960202534994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.01,0.13583359718322754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.01,0.15460480451583863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.01,0.20562560558319093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.01,0.29032320976257325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.01,0.3915519952774048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.01,0.47472639083862306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,4,power_law_1.2,0.03751679956912994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.01,0.7580160140991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.01,1.002355194091797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,4,power_law_1.2,0.0344895988702774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,4,power_law_1.2,0.03580160140991211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.01,1.2098752021789552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,balanced,1.0249653657277424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,4,power_law_1.2,0.04394879937171936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.01,2.220403289794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,4,power_law_1.2,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.01,4.2682239532470705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,4,power_law_1.2,0.05783680081367493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,4,power_law_1.2,0.05822719931602478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,balanced,1.430741310119629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,4,power_law_1.2,0.035366401076316833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,4,power_law_1.2,0.061791998147964475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,4,power_law_1.2,0.03315840065479279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,4,power_law_1.2,0.06166399717330932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,4,power_law_1.2,0.03473919928073883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,4,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,4,power_law_1.2,0.037945601344108584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,4,power_law_1.2,0.04389120042324066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,4,power_law_1.2,0.06154239773750305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,4,power_law_1.2,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,4,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,4,power_law_1.2,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,4,power_law_1.2,0.05107839703559876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,4,power_law_1.2,0.06312959790229797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,4,power_law_1.2,0.05204480290412903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,4,power_law_1.2,0.06845440268516541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,balanced,1.5744853019714355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,4,power_law_1.2,0.05336959958076477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,4,power_law_1.2,0.07525119781494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,4,power_law_1.2,0.0788927972316742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,4,power_law_1.2,0.05651199817657471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,4,power_law_1.2,0.08528640270233154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,4,power_law_1.2,0.06098560094833374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,4,power_law_1.2,0.10089600086212158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,4,power_law_1.2,0.06707839965820313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,4,power_law_1.2,0.11982079744338989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,4,power_law_1.2,0.06532480120658875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,4,power_law_1.2,0.13755520582199096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,4,power_law_1.2,0.0711679995059967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,4,power_law_1.2,0.16437760591506959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,4,power_law_1.2,0.08023679852485657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,4,power_law_1.2,0.20683519840240477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,4,power_law_1.2,0.08773120045661927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,4,power_law_1.2,0.270361590385437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,4,power_law_1.2,0.10374399423599243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,4,power_law_1.2,0.35688960552215576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,4,power_law_1.2,0.10803840160369874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,4,power_law_1.2,0.14209920167922974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,4,power_law_1.2,0.5654272079467774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,4,power_law_1.2,0.15892479419708253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,4,power_law_1.2,0.7107071876525879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,4,power_law_1.2,0.22576639652252198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,4,power_law_1.2,1.1026368141174316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,4,power_law_1.2,0.289190411567688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,4,power_law_1.2,1.212716770172119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,4,power_law_1.2,0.4166272163391113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,4,power_law_1.2,2.310451126098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,4,power_law_1.2,0.565388822555542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,4,power_law_1.2,0.8650431632995605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,power_law_1.2,5.162092971801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,4,power_law_1.2,1.269375991821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,4,balanced,2.8149547576904297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,4,power_law_1.2,1.6005311965942384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,4,power_law_1.2,2.61081600189209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,power_law_1.2,5.640991973876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,4,balanced,3.154618581136068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,balanced,0.05308799942334493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,balanced,0.05464000006516775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,balanced,0.06353066861629486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,balanced,0.07658133407433827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,balanced,0.08562666177749634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,balanced,0.08533866206804912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,balanced,0.08797867099444072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,balanced,0.049045334259668984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,balanced,0.08744000395139058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,balanced,0.08762666583061218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,balanced,0.04916266600290934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,balanced,0.08884800473848979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,balanced,0.049173335234324135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,balanced,0.05216533442338308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,balanced,0.08982933561007182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,balanced,0.06338666876157124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,balanced,0.0897866686185201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,balanced,0.06861333549022675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,balanced,0.09171733260154724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,balanced,0.07028266787528992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,balanced,0.09541333715120952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,balanced,0.07088000078996022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,balanced,0.09754666686058044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,balanced,0.07086400190989177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,balanced,0.07145600020885468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,balanced,0.09858133395512898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,balanced,0.07330133517583211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,balanced,0.10910933216412862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,balanced,0.07390933235486348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,balanced,0.10965333382288615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,balanced,0.07522133489449818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,balanced,0.0767626663049062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,balanced,0.1368053356806437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,balanced,0.0825439989566803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,balanced,0.08422933022181193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,balanced,0.1306613286336263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,balanced,0.04199466605981191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,balanced,0.08735466996828715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,balanced,0.04268266757329305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,balanced,0.10315199693044026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,balanced,0.1695893406867981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,balanced,0.04279999931653341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,balanced,0.045882667104403176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,balanced,0.10480533043543498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,balanced,0.06216000020503998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,balanced,0.17469867070515951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,balanced,0.0633546660343806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,balanced,0.1327946682771047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,balanced,0.06446399788061778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,balanced,0.06533866624037425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,balanced,0.13834133744239807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,balanced,0.06515733400980632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,balanced,0.24356800317764282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,balanced,0.06699199974536896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,balanced,0.06803733110427856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,balanced,0.18106667200724283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,balanced,0.06756266454855601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,balanced,0.06991999844710033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,balanced,0.0703306645154953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,balanced,0.20616000890731812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,balanced,0.27617067098617554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,balanced,0.07597333192825317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,balanced,0.07930666704972585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,balanced,0.28859732548395794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,balanced,0.08259200056393941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,balanced,0.42261866728464764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,balanced,0.34984532992045086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,balanced,0.08979733784993489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,balanced,0.0979253351688385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.01,0.09067519903182983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,balanced,0.5041546821594238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,balanced,0.5162773529688517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.01,0.08357759714126586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.01,0.0685696005821228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.01,0.06734079718589783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.01,0.07210239768028259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.01,0.06286079883575439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,balanced,0.1130560040473938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.01,0.07477120161056519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.01,0.055257600545883176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,power_law_1.01,0.06224640011787415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.01,0.08432000279426574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.01,0.0576960027217865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,4,32,power_law_1.2,0.09067519903182983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,balanced,0.1270026663939158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,power_law_1.01,0.05808640122413635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.01,0.06115840077400207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.01,0.08064640164375306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,4,32,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.01,0.06735360026359558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,power_law_1.01,0.04528000056743622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.01,0.08350719809532166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,balanced,0.6384960015614828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,4,32,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.01,0.06817280054092408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,power_law_1.01,0.05477759838104248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,balanced,0.6084693272908529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.01,0.08857600092887878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.01,0.06793599724769592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,4,32,power_law_1.2,0.07123200297355652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,power_law_1.01,0.05998079776763916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.01,0.06849279999732971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,4,32,power_law_1.2,0.07059839963912964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.01,0.08999040126800537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,balanced,0.16220266620318094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,power_law_1.01,0.06111360192298889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.01,0.07214720249176025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,4,32,power_law_1.2,0.08305919766426087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.01,0.08691200017929077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.01,0.07276160120964051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,power_law_1.01,0.06442880034446716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,4,32,power_law_1.2,0.08234239816665649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.01,0.09379199743270875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.01,0.07470080256462097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,power_law_1.01,0.06577280163764954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,4,32,power_law_1.2,0.08466560244560242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,balanced,0.18850133816401163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.01,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.01,0.07771520018577575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,4,32,power_law_1.2,0.08954880237579346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.01,0.09457280039787293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.01,0.0819263994693756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,4,32,power_law_1.2,0.0905023992061615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,power_law_1.01,0.06839680075645446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.01,0.10194560289382934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,4,32,power_law_1.2,0.09262080192565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.01,0.09139840006828308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,power_law_1.01,0.07022719979286193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,4,32,power_law_1.2,0.09592959880828858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.01,0.10645760297775268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,power_law_1.01,0.0732800006866455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.01,0.09512320160865784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,balanced,0.7807199954986572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,4,32,power_law_1.2,0.0967743992805481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,power_law_1.01,0.0732159972190857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.01,0.1176192045211792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.01,0.09807360172271729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,4,32,power_law_1.2,0.09923200011253357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,balanced,0.2603253324826558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,power_law_1.01,0.08015999794006348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.01,0.12651519775390624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.01,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,4,32,power_law_1.2,0.10401279926300049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,power_law_1.01,0.08919039964675904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.01,0.1268671989440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.01,0.1466048002243042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,4,32,power_law_1.2,0.122489595413208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.01,0.16427520513534546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.01,0.18440959453582764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,4,32,power_law_1.2,0.12800639867782593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,power_law_1.01,0.09408640265464782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.01,0.18149759769439697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,balanced,0.879968007405599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.01,0.2011199951171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,4,32,power_law_1.2,0.16424959897994995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.01,0.23546879291534423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,balanced,0.3461546500523885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,4,32,power_law_1.2,0.161190402507782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.01,0.26803200244903563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,power_law_1.01,0.10229760408401489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.01,0.29419519901275637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,4,32,power_law_1.2,0.25677440166473386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.01,0.29216001033782957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.01,0.3826368093490601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,4,32,power_law_1.2,0.23021440505981444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.01,0.3982975959777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.01,0.5074880123138428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,4,32,power_law_1.2,0.33676800727844236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,power_law_1.01,0.11608959436416626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.01,0.7149119853973389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.01,0.4686272144317627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,4,32,power_law_1.2,0.36027519702911376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,power_law_1.01,0.13551360368728638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.01,0.9774208068847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.01,0.6536128044128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,4,32,power_law_1.2,0.49008002281188967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,balanced,0.4813813368479411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.01,1.2675007820129394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.01,1.0676095962524415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,4,32,power_law_1.2,0.6334144115447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.01,1.942643165588379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,power_law_1.01,0.15994240045547486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.01,1.1823743820190429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,balanced,1.1856799920399983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,4,32,power_law_1.2,0.8202431678771973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,power_law_1.01,0.20365440845489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.01,1.9515520095825196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.01,3.927724838256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,4,32,power_law_1.2,1.3519359588623048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,power_law_1.01,0.3232640027999878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,4,32,power_law_1.2,1.9417152404785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.01,3.586521530151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,4,32,power_law_1.2,0.06691840291023254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,power_law_1.01,0.3299839973449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,4,32,power_law_1.2,3.280166244506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,4,32,power_law_1.2,0.05743359923362732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,power_law_1.01,0.536736011505127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,power_law_1.2,5.255449676513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,4,32,power_law_1.2,0.056992000341415404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,power_law_1.01,0.6635968208312988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,4,32,power_law_1.2,0.056959998607635495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,power_law_1.01,1.066156768798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,balanced,0.6315573453903198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,4,32,power_law_1.2,0.061894398927688596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,power_law_1.01,1.341043186187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,4,32,power_law_1.2,0.06776959896087646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,power_law_1.01,1.7711807250976563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,4,32,power_law_1.2,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,power_law_1.01,2.8439231872558595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,4,32,power_law_1.2,0.06996480226516724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,4,32,power_law_1.2,0.07099519968032837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,power_law_1.01,5.8820030212402346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,4,32,power_law_1.2,0.07200639843940734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,4,32,power_law_1.2,0.0745855987071991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,4,32,balanced,1.672693411509196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,balanced,0.7760907014211019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,4,32,power_law_1.2,0.0765504002571106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,4,32,power_law_1.2,0.07932159900665284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,4,32,power_law_1.2,0.0858240008354187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,4,32,power_law_1.2,0.09490560293197632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,4,32,power_law_1.2,0.1017408013343811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,4,32,power_law_1.2,0.10332800149917602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,4,32,power_law_1.2,0.13082239627838135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,4,32,power_law_1.2,0.13671679496765138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,4,32,power_law_1.2,0.18283519744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,balanced,2.335418701171875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,4,32,power_law_1.2,0.22021760940551757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,4,32,power_law_1.2,0.26149759292602537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,4,32,power_law_1.2,0.3337023973464966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,4,32,power_law_1.2,0.47579522132873536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,balanced,1.1890026728312175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,4,32,power_law_1.2,0.6115007877349854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,4,32,power_law_1.2,1.0631039619445801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,4,32,power_law_1.2,1.3845376014709472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,4,32,power_law_1.2,1.5059840202331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,4,32,power_law_1.2,2.558470344543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,4,32,power_law_1.2,6.151148986816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,balanced,2.381685256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,4,32,power_law_1.2,0.06273279786109924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,4,32,power_law_1.2,0.051660799980163576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,4,32,power_law_1.2,0.045337599515914914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,4,32,power_law_1.2,0.054771202802658084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,balanced,0.05089066425959269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,4,32,power_law_1.2,0.05737599730491638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,balanced,0.04692266881465912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,4,32,power_law_1.2,0.06219519972801209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,balanced,0.05184000233809153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,balanced,0.04766400158405304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,balanced,0.05495999753475189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,4,32,power_law_1.2,0.060096001625061034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,balanced,0.04864533245563507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,balanced,0.06364800035953522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,4,32,power_law_1.2,0.06405760049819946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,balanced,0.0526506652434667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,balanced,0.07715199887752533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,4,32,power_law_1.2,0.06622080206871032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,balanced,0.06333333253860474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,balanced,0.08717333277066548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,4,32,power_law_1.2,0.0673088014125824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,balanced,0.06974933544794719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,balanced,0.08866133292516072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,4,32,power_law_1.2,0.07175679802894593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,balanced,0.07173333565394084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,balanced,0.08963732918103536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,4,32,power_law_1.2,0.07537919878959656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,balanced,0.07246399919191997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,balanced,0.08954667051633199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,4,32,power_law_1.2,0.0762880027294159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,balanced,0.07247466842333476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,balanced,0.09000000357627869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,balanced,0.07310399909814198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,4,32,power_law_1.2,0.08673279881477355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,balanced,0.09185600280761719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.01,0.08303999900817871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,balanced,0.0747573326031367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,4,32,power_law_1.2,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,balanced,0.09270933270454407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,balanced,0.04309333364168803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,balanced,0.0746559997399648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.01,0.0893567979335785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,balanced,0.09286399682362874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,4,32,power_law_1.2,0.0979200005531311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,balanced,0.07659733295440674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.01,0.06440320014953613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,balanced,0.043605332573254905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,balanced,0.09490133325258891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.01,0.06787199974060058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,balanced,0.0788320004940033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,balanced,0.09885332981745402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,balanced,0.04811733464399973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,4,32,power_law_1.2,0.11018240451812744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.01,0.07308160066604615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,balanced,0.08310399949550629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,balanced,0.10657067100207011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,balanced,0.06267733375231425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.01,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,balanced,0.06555733581384023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,balanced,0.08538666367530823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,balanced,0.10170666376749675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,balanced,0.06716266771157582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.01,0.08333439826965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,balanced,0.08963732918103536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,balanced,0.12053333719571431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,4,32,power_law_1.2,0.127347195148468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,balanced,0.06825600067774455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.01,0.06724479794502258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.01,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,balanced,0.06764799853165944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,balanced,0.11062399546305339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,balanced,0.11741866668065389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,4,32,power_law_1.2,0.14350080490112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,balanced,0.06920533378918965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.01,0.08403199911117554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.01,0.06424959897994995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,balanced,0.1113813320795695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,balanced,0.07106666763623555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,balanced,0.15000533064206442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.01,0.08639360070228577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.01,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,balanced,0.07141866783301036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,balanced,0.14221333463986716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,4,32,power_law_1.2,0.21075839996337892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.01,0.09342719912528992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.01,0.05801600217819214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,balanced,0.14297599593798319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,balanced,0.07375999788443248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,4,32,power_law_1.2,0.29782400131225584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.01,0.09682559967041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.01,0.05811840295791626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,balanced,0.07519466678301494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,balanced,0.14658666650454202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.01,0.09363200068473816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,balanced,0.18615466356277466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,balanced,0.08116800089677174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.01,0.06719359755516052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,4,32,power_law_1.2,0.3640768051147461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.01,0.10088319778442383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.01,0.06841599941253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,balanced,0.19476799170176187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,4,32,power_law_1.2,0.4863743782043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.01,0.12400640249252319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.01,0.06869760155677795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,balanced,0.2005013426144918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,balanced,0.08541333675384521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.01,0.12794239521026612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.01,0.06907520294189454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,4,32,power_law_1.2,0.6889023780822754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,balanced,0.22445333003997803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.01,0.12083840370178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.01,0.07058560252189636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,4,32,power_law_1.2,0.9988672256469726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,balanced,0.09061333537101746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.01,0.1341312050819397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.01,0.07222399711608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,balanced,0.288154661655426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,4,32,power_law_1.2,1.411731243133545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.01,0.14582400321960448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.01,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,balanced,0.32318933804829914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.01,0.18353279829025268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.01,0.07726719975471497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,4,32,power_law_1.2,1.8911872863769532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.01,0.20156800746917725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.01,0.08060160279273987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.01,0.25501439571380613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.01,0.0882752001285553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,4,32,power_law_1.2,2.8550783157348634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,balanced,0.3316533366839091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,balanced,0.1009386678536733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.01,0.09442560076713562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.01,0.3144128084182739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,4,32,power_law_1.2,4.283244705200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,balanced,0.3930826584498088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,balanced,0.1111306647459666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.01,0.10514559745788574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.01,0.42922239303588866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,power_law_1.01,0.06258559823036194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.01,0.11646080017089844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.01,0.5239168167114258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,power_law_1.01,0.05989760160446167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,4,32,power_law_1.2,10.993791961669922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.01,0.13155839443206788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,power_law_1.01,0.046937599778175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.01,0.7428351879119873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,power_law_1.01,0.05255680084228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.01,0.16151679754257203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.01,1.083993625640869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,balanced,0.492415984471639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,power_law_1.01,0.05613440275192261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.01,0.18367999792099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,balanced,0.13148799538612366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,power_law_1.01,0.06459519863128663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.01,1.2486016273498535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.01,0.2533760070800781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,balanced,0.577397346496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,power_law_1.01,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.01,1.6980031967163085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.01,0.297708797454834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,balanced,0.15133866667747498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,power_law_1.01,0.0671999990940094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.01,0.42778878211975097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,power_law_1.01,0.06936320066452026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.01,3.6698047637939455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.01,0.5323071956634522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,power_law_1.01,0.07043200135231018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.01,0.7546751976013184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,power_law_1.01,0.07472000122070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.01,1.0455039978027343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,power_law_1.01,0.07566720247268677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,balanced,0.59825066725413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,balanced,0.2059040069580078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,power_law_1.01,0.08264319896697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.01,1.209823989868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,power_law_1.01,0.0856768012046814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,balanced,0.7137973308563232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,16,power_law_1.2,0.08267520070075988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.01,1.8349119186401368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,power_law_1.01,0.09242240190505982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,balanced,0.2587626576423645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,16,power_law_1.2,0.0617792010307312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.01,4.192319869995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,16,power_law_1.2,0.06174719929695129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,power_law_1.01,0.09751039743423462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,16,power_law_1.2,0.06668800115585327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,16,power_law_1.2,0.06974719762802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,power_law_1.01,0.1091647982597351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,16,power_law_1.2,0.07717120051383972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,16,power_law_1.2,0.08176640272140503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,balanced,0.371888001759847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,balanced,0.7114880084991455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,16,power_law_1.2,0.08424959778785705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,power_law_1.01,0.1241919994354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,16,power_law_1.2,0.08558719754219055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,balanced,0.8722773392995199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,power_law_1.01,0.1469823956489563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,16,power_law_1.2,0.09057919979095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,16,power_law_1.2,0.09327999949455261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,balanced,0.4787573417027791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,16,power_law_1.2,0.09481599926948547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,power_law_1.01,0.20021119117736816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,16,power_law_1.2,0.09729920029640197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,power_law_1.01,0.23633279800415039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,16,power_law_1.2,0.11081600189208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,16,power_law_1.2,0.11932159662246704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,power_law_1.01,0.3228480100631714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,16,power_law_1.2,0.138374400138855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,power_law_1.01,0.39978880882263185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,16,power_law_1.2,0.12307200431823731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,balanced,0.6683573722839355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,16,power_law_1.2,0.15318399667739868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,16,power_law_1.2,0.15470080375671386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,power_law_1.01,0.5905856132507324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,16,power_law_1.2,0.19724160432815552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,power_law_1.01,0.9391039848327637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,balanced,1.0533013343811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,16,power_law_1.2,0.22156798839569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,power_law_1.01,1.1719231605529785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,16,power_law_1.2,0.2968640089035034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,balanced,1.3475359280904133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,16,power_law_1.2,0.3623296022415161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,power_law_1.01,1.6237503051757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,balanced,0.8756586710611979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,16,power_law_1.2,0.5276927947998047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,power_law_1.01,2.0655168533325194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,16,power_law_1.2,0.6227712154388427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,power_law_1.01,2.8084224700927733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,16,power_law_1.2,1.0812288284301759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,16,power_law_1.2,1.3157119750976562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,power_law_1.01,6.152198410034179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,16,power_law_1.2,1.7729087829589845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,16,power_law_1.2,2.4840063095092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,power_law_1.2,4.875724792480469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,balanced,1.074133316675822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,16,balanced,1.9984320004781086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,balanced,1.672202746073405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,balanced,2.651045322418213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,16,power_law_1.2,0.0636352002620697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,16,power_law_1.2,0.054604798555374146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,16,power_law_1.2,0.05427839756011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,16,power_law_1.2,0.05687680244445801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,16,power_law_1.2,0.05894399881362915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,balanced,3.3312320709228516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,16,power_law_1.2,0.06312959790229797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,16,power_law_1.2,0.06789759993553161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,16,power_law_1.2,0.06999040246009827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,16,power_law_1.2,0.06857600212097167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,16,power_law_1.2,0.059961599111557004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,16,power_law_1.2,0.0713599979877472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,16,power_law_1.2,0.04960640072822571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,16,power_law_1.2,0.07502719759941101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,16,power_law_1.2,0.0759935975074768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,16,power_law_1.2,0.047814399003982544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,balanced,0.053029333551724754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,16,power_law_1.2,0.08061439990997314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,16,power_law_1.2,0.052716797590255736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,balanced,0.052245333790779114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,16,power_law_1.2,0.0813696026802063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,16,power_law_1.2,0.05812479853630066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,balanced,0.056015998125076294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,16,power_law_1.2,0.09248639941215515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,balanced,0.06569066643714905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,16,power_law_1.2,0.06327679753303528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,16,power_law_1.2,0.09752320051193238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,balanced,0.08164266745249431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,16,power_law_1.2,0.06640639901161194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,balanced,0.09193600217501323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,16,power_law_1.2,0.10794240236282349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,16,power_law_1.2,0.06855679750442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,balanced,0.0925546685854594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,16,power_law_1.2,0.13541120290756226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,16,power_law_1.2,0.06792960166931153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,balanced,0.09476266304651897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,16,power_law_1.2,0.13480960130691527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,16,power_law_1.2,0.07066879868507385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,balanced,0.09380267063776652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,16,power_law_1.2,0.1748800039291382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,16,power_law_1.2,0.07537919878959656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,balanced,0.09564266602198283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,16,power_law_1.2,0.19731839895248413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,16,power_law_1.2,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,balanced,0.09867200255393982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,balanced,0.09875200192133586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,16,power_law_1.2,0.08216959834098816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,16,power_law_1.2,0.28136320114135743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,balanced,0.09987733761469524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,16,power_law_1.2,0.09264000058174134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,16,power_law_1.2,0.33299200534820556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,balanced,0.09990400075912476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,16,power_law_1.2,0.10581760406494141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,16,power_law_1.2,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,balanced,0.10752532879511516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,16,power_law_1.2,0.5928192138671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,balanced,0.10910399754842122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,16,power_law_1.2,0.10535039901733398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,16,power_law_1.2,0.9437631607055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,balanced,0.11061333616574605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,16,power_law_1.2,0.11664639711380005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,balanced,0.15155733625094095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,16,power_law_1.2,1.252070426940918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,balanced,0.13133866588274637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,16,power_law_1.2,1.734726333618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,16,power_law_1.2,0.1277119994163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,balanced,0.04669866462548574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,balanced,0.16380266348520914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,16,power_law_1.2,2.4496128082275392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,16,power_law_1.2,0.15633920431137086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,balanced,0.04717333118120829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,balanced,0.16986666123072305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,16,power_law_1.2,5.89056625366211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,balanced,0.05259733398755392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,16,power_law_1.2,0.21542398929595946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,balanced,0.054383998115857445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,balanced,0.2439039945602417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,balanced,0.06941333413124084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,16,power_law_1.2,0.297491192817688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,balanced,0.07521066566308339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,balanced,0.2566666603088379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,16,power_law_1.2,0.4415616035461426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,balanced,0.0759200006723404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,16,power_law_1.2,0.5980735778808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,balanced,0.07712533573309581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,balanced,0.07761066655317943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,16,power_law_1.2,0.815180778503418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,balanced,0.3794613281885783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,16,power_law_1.2,0.9698495864868164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,balanced,0.07845333218574524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,16,power_law_1.2,1.4217856407165528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,balanced,0.07966933151086171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,balanced,0.043893332282702126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,16,power_law_1.2,2.2193023681640627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,balanced,0.07909333209196727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,balanced,0.4338293472925822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,balanced,0.045653333266576133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,balanced,0.08179200192292531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,16,power_law_1.2,2.765017509460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,balanced,0.047685335079828896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.01,0.06772480010986329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,balanced,0.052928000688552856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,balanced,0.08312533299128215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,balanced,0.06835733354091644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,16,power_law_1.2,3.8880062103271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.01,0.07427840232849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,balanced,0.07246399919191997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,balanced,0.09064533313115437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,balanced,0.07446399827798207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.01,0.05783039927482605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,balanced,0.07483200232187907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,16,power_law_1.2,11.012678527832032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,balanced,0.09301867087682088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,balanced,0.07606933514277141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,balanced,0.6662880182266235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.01,0.06873599886894226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,balanced,0.07712000111738841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,balanced,0.10037866234779358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,balanced,0.0784853349129359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.01,0.07434880137443542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,balanced,0.08024533092975616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,balanced,0.12471466263135274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,balanced,0.08298133313655853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.01,0.08492159843444824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,balanced,0.08543999989827473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,balanced,0.12276800473531087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.01,0.054764801263809205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.01,0.0865343987941742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,balanced,0.09179733196894328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,balanced,0.15099199612935385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.01,0.06241919994354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.01,0.0887615978717804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,balanced,0.09957333405812581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.01,0.0549888014793396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.01,0.08873599767684937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,balanced,0.167194664478302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,balanced,0.7809866269429525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.01,0.057081598043441775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.01,0.08967679738998413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,balanced,0.10910399754842122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.01,0.06284800171852112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,balanced,0.23380800088246664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.01,0.09902719855308532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.01,0.06931840181350708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.01,0.10340479612350464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.01,0.07258880138397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.01,0.10598399639129638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,balanced,0.2765120069185893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,balanced,0.12398933370908101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.01,0.10614399909973145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.01,0.07225599884986877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.01,0.11385600566864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,balanced,0.13760000467300415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.01,0.07439360022544861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.01,0.11877119541168213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.01,0.07497599720954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,balanced,0.39691734313964844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.01,0.13441920280456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.01,0.07841920256614685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,balanced,0.9265173276265463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.01,0.16178560256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.01,0.084307199716568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,balanced,0.1760960022608439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.01,0.1652735948562622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.01,0.0884223997592926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.01,0.2048896074295044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.01,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,balanced,0.4935520092646281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,balanced,0.2216320037841797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.01,0.09612159729003907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.01,0.23081600666046143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.01,0.10083199739456176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.01,0.2984960079193115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,balanced,0.32215466101964313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.01,0.11572480201721191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.01,0.3478271961212158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.01,0.13281919956207275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.01,0.48390398025512693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,balanced,0.39646931489308673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.01,0.1483456015586853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.01,0.6194560050964355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,balanced,0.7390186786651611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.01,0.17441279888153077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.01,0.9593279838562012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.01,0.20667519569396972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,power_law_1.01,0.05438719987869263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.01,1.1461312294006347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.01,0.2660928010940552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,power_law_1.01,0.060812801122665405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.01,0.34956159591674807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,balanced,0.558895985285441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.01,1.401318359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,power_law_1.01,0.0506496012210846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,balanced,1.4991307258605957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.01,0.4891392230987549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,power_law_1.01,0.05793920159339905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.01,2.2225215911865233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,power_law_1.01,0.06042240262031555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.01,0.6171584129333496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,power_law_1.01,0.07100160121917724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,balanced,0.8979093233744303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.01,0.9170175552368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,power_law_1.01,0.07383040189743043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.01,4.564012908935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,balanced,0.7234826882680258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.01,1.1571647644042968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,power_law_1.01,0.07504000067710877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,power_law_1.01,0.07654399871826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.01,1.585318374633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,power_law_1.01,0.07947520017623902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.01,2.2640575408935546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,power_law_1.01,0.08419200181961059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,power_law_1.01,0.08837119936943054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,power_law_1.01,0.09224960207939148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.01,4.667123031616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,power_law_1.01,0.09995520114898682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,balanced,1.0419360001881917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,power_law_1.01,0.11424640417099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,power_law_1.01,0.10700160264968872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,balanced,1.0935040314992268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,power_law_1.01,0.1360703945159912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,power_law_1.01,0.1506816029548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,balanced,1.3716106414794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,power_law_1.01,0.17447680234909058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,power_law_1.01,0.25231359004974363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,power_law_1.01,0.30877439975738524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,power_law_1.01,0.4348927974700928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,power_law_1.01,0.5529280185699463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,8,power_law_1.2,0.06750720143318176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,power_law_1.01,0.7609280109405517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,balanced,1.753119945526123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,balanced,1.6702826817830403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,8,power_law_1.2,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,power_law_1.01,0.9763263702392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,8,power_law_1.2,0.059552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,power_law_1.01,1.550419235229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,balanced,2.893690745035807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,8,power_law_1.2,0.07059839963912964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,power_law_1.01,2.1569984436035154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,8,power_law_1.2,0.07215359807014465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,power_law_1.01,2.5603776931762696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,8,power_law_1.2,0.08594560027122497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,8,power_law_1.2,0.08695039749145508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,power_law_1.01,4.587315368652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,8,power_law_1.2,0.08843520283699036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,8,power_law_1.2,0.09022079706192017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,power_law_1.01,7.622828674316406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,8,power_law_1.2,0.09301120042800903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,8,power_law_1.2,0.09763839840888977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,8,power_law_1.2,0.10492160320281982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,8,power_law_1.2,0.11167999505996704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,balanced,2.6419307390848794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,8,power_law_1.2,0.10922880172729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,8,power_law_1.2,0.12222080230712891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,8,power_law_1.2,0.13160959482192994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,8,power_law_1.2,0.14780800342559813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,8,power_law_1.2,0.1779263973236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,8,power_law_1.2,0.17200000286102296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,8,power_law_1.2,0.19708160161972046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,8,power_law_1.2,0.2334912061691284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,8,power_law_1.2,0.3061503887176514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,8,power_law_1.2,0.4286975860595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,8,power_law_1.2,0.5729152202606201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,8,power_law_1.2,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,8,power_law_1.2,0.6523647785186768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,8,power_law_1.2,0.052095997333526614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,8,power_law_1.2,1.120633602142334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,balanced,3.441770553588867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,8,power_law_1.2,0.05482879877090454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,8,power_law_1.2,1.190272045135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,8,power_law_1.2,0.056569600105285646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,8,power_law_1.2,1.7172735214233399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,8,power_law_1.2,0.06063359975814819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,8,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,8,power_law_1.2,2.791244888305664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,8,power_law_1.2,0.0712768018245697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,8,power_law_1.2,5.669561767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,8,power_law_1.2,0.07303680181503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,8,power_law_1.2,0.07578240036964416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,8,power_law_1.2,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,8,power_law_1.2,0.07897599935531616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,balanced,5.275125185648601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,8,power_law_1.2,0.08340479731559754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,8,power_law_1.2,0.08688639998435974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,8,power_law_1.2,0.08878080248832702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,8,power_law_1.2,0.10151040554046631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,8,power_law_1.2,0.10584959983825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,8,power_law_1.2,0.11921279430389405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,8,power_law_1.2,0.1501952052116394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,8,power_law_1.2,0.14835840463638306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,8,power_law_1.2,0.1838655948638916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,8,power_law_1.2,0.2248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,8,power_law_1.2,0.3182719945907593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,8,power_law_1.2,0.35960960388183594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,8,power_law_1.2,0.5801792144775391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,8,power_law_1.2,0.7284480094909668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,8,power_law_1.2,1.0673088073730468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,8,power_law_1.2,1.49552640914917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,8,power_law_1.2,0.05390080213546753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,8,power_law_1.2,1.7599807739257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,8,power_law_1.2,0.05175679922103882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,8,power_law_1.2,0.05006080269813538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,8,power_law_1.2,3.4249408721923826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,8,power_law_1.2,0.05766400098800659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,balanced,0.052202666799227394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,8,power_law_1.2,0.06157439947128296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,8,power_law_1.2,6.0621696472167965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,8,power_law_1.2,0.0707264006137848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,balanced,0.05354666709899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,8,power_law_1.2,0.07087360024452209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,balanced,0.058176000912984215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,8,power_law_1.2,0.07351040244102477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,balanced,0.07320533196131389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,8,power_law_1.2,0.07767040133476258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,balanced,0.09153067072232564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,8,power_law_1.2,0.07856000065803528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,8,power_law_1.2,0.08685439825057983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,balanced,0.09908800323804219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,8,power_law_1.2,0.08870400190353393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,balanced,0.09947733084360759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,8,power_law_1.2,0.09201920032501221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,balanced,0.101200004418691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,8,power_law_1.2,0.10327680110931396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,balanced,0.10150933265686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,8,power_law_1.2,0.11456639766693115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,balanced,0.10284266869227092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,8,power_law_1.2,0.12142080068588257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,balanced,0.10408000151316325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,balanced,0.10666132966677348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,8,power_law_1.2,0.1343808054924011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,balanced,0.10686933000882466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,balanced,0.11084799965222676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,balanced,0.11983999609947205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,8,power_law_1.2,0.16015360355377198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,balanced,0.13833066821098328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,balanced,0.047055999437967934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,8,power_law_1.2,0.19939199686050416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,balanced,0.12455466389656067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,balanced,0.050106664498647056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,balanced,0.16966400543848673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,balanced,0.05201066533724467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,8,power_law_1.2,0.27583999633789064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,balanced,0.06020266811052958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,balanced,0.15868799885114035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,8,power_law_1.2,0.3216831922531128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,balanced,0.07775466640790303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,8,power_law_1.2,0.5238719940185547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,balanced,0.20797866582870483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,balanced,0.083514670530955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,8,power_law_1.2,0.5957568168640137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,balanced,0.08505066235860188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,balanced,0.21845867236455283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,balanced,0.08675733208656311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,8,power_law_1.2,0.9407999992370606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,balanced,0.0867199997107188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,balanced,0.318720002969106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,balanced,0.08711466193199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,8,power_law_1.2,1.360364818572998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,balanced,0.08918933073679607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,8,power_law_1.2,1.7937152862548829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,balanced,0.09134399890899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,8,power_law_1.2,2.2184959411621095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,balanced,0.378383994102478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,balanced,0.09344533085823059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,balanced,0.09682133793830872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,8,power_law_1.2,3.559519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,balanced,0.10419733325640361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,8,power_law_1.2,5.2169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,balanced,0.108815997838974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,balanced,0.5660640001296997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,balanced,0.11549333731333415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,8,power_law_1.2,11.467142486572266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,balanced,0.16171733538309732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,balanced,0.1473973294099172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,balanced,0.6873119672139486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,balanced,0.1918720006942749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,balanced,0.2095093329747518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,balanced,0.3064746658007304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,balanced,1.0158080259958904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,balanced,0.3888266483942668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.01,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,balanced,0.5581546624501547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.01,0.0723136007785797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,balanced,1.2075146834055583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.01,0.06876159906387329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.01,0.07580800056457519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.01,0.09008640050888062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,balanced,0.7303199768066406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.01,0.09280639886856079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.01,0.05063679814338684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.01,0.09681919813156128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.01,0.09836800098419189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.01,0.0616320013999939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.01,0.09979519844055176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.01,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.01,0.1022271990776062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.01,0.060703998804092406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.01,0.10700160264968872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.01,0.06505600214004517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,balanced,1.4646347363789876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,balanced,1.07204802831014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.01,0.11201280355453491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.01,0.07865599989891052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.01,0.07930240035057068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.01,0.12184959650039673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.01,0.08143360018730164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.01,0.14262399673461915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.01,0.08154240250587463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.01,0.15323519706726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.01,0.08421760201454162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.01,0.14371199607849122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.01,0.09085440039634704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.01,0.18735359907150267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.01,0.09311360120773315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.01,0.09843840003013611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.01,0.1943168044090271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,balanced,1.304800033569336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.01,0.10192639827728271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.01,0.2334656000137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.01,0.10949120521545411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.01,0.2748800039291382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.01,0.11829760074615478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.01,0.33936638832092286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.01,0.13063039779663085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.01,0.16510080099105834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.01,0.48549761772155764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.01,0.17446399927139283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.01,0.6079743862152099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,balanced,2.3435306549072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.01,0.21395199298858641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.01,0.7334784030914306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.01,0.25477759838104247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.01,1.106387233734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.01,0.3358272075653076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.01,0.3995840072631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.01,1.5113856315612793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,balanced,1.6068320274353027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,4,power_law_1.2,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.01,0.6027071952819825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.01,1.9701120376586914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,4,power_law_1.2,0.06416000127792358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.01,0.7932544231414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,4,power_law_1.2,0.05902720093727112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.01,2.792531204223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,4,power_law_1.2,0.06967679858207702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.01,1.220588779449463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,4,power_law_1.2,0.07553920149803162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.01,1.5543423652648927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,4,power_law_1.2,0.09045760035514831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.01,5.848064041137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,4,power_law_1.2,0.09321600198745728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.01,1.9341760635375977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,4,power_law_1.2,0.0983295977115631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.01,2.98275203704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,4,power_law_1.2,0.09698560237884521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,4,power_law_1.2,0.10109440088272095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,4,power_law_1.2,0.10492160320281982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.01,6.234214401245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,4,power_law_1.2,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,4,power_law_1.2,0.11230720281600952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,4,power_law_1.2,0.12773120403289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,4,power_law_1.2,0.1453503966331482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,4,power_law_1.2,0.15020159482955933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,balanced,2.536245346069336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,4,power_law_1.2,0.1664512038230896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,4,power_law_1.2,0.18409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,4,power_law_1.2,0.20130560398101807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,4,power_law_1.2,0.24206719398498536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,4,power_law_1.2,0.29285759925842286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,4,power_law_1.2,0.3713792085647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,4,power_law_1.2,0.4955264091491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,4,power_law_1.2,0.666476821899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,4,power_law_1.2,0.8969920158386231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,balanced,4.674655914306641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,4,power_law_1.2,1.320627212524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,4,power_law_1.2,1.5468159675598145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,4,power_law_1.2,1.8870080947875976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,4,power_law_1.2,3.4702079772949217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,4,power_law_1.2,7.782310485839844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,4,power_law_1.2,0.05052800178527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,balanced,5.013152122497559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,4,power_law_1.2,0.04862079918384552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,4,power_law_1.2,0.052928000688552856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,4,power_law_1.2,0.05979520082473755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,4,power_law_1.2,0.0641152024269104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,4,power_law_1.2,0.07591040134429931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,4,power_law_1.2,0.07933440208435058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,4,power_law_1.2,0.08135039806365967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,4,power_law_1.2,0.08209919929504395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,4,power_law_1.2,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,4,power_law_1.2,0.09169279932975768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,4,power_law_1.2,0.09408000111579895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,4,power_law_1.2,0.09884160161018371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,4,power_law_1.2,0.10341759920120239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,4,power_law_1.2,0.11603840589523315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,4,power_law_1.2,0.11799039840698242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,4,power_law_1.2,0.13804160356521605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,4,power_law_1.2,0.1720128059387207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,4,power_law_1.2,0.17297279834747314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,4,power_law_1.2,0.21437439918518067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,4,power_law_1.2,0.2699007987976074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,4,power_law_1.2,0.35829761028289797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,4,power_law_1.2,0.46579837799072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,4,power_law_1.2,0.6427455902099609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,4,power_law_1.2,0.8559359550476074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,4,power_law_1.2,1.4778559684753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,4,power_law_1.2,1.7159231185913086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,4,power_law_1.2,2.330713653564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,4,power_law_1.2,3.9631679534912108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,4,power_law_1.2,7.037158203125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,balanced,0.19530133406321207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,balanced,0.19117865959803262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,balanced,0.19314134120941162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,balanced,0.1994719902674357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,balanced,0.20295466979344687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,balanced,0.3489493529001872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,balanced,0.5122079849243164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,balanced,0.5291200081507365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,balanced,0.5207733313242594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,balanced,0.520090659459432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,balanced,0.4960266749064128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,balanced,0.483237346013387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,balanced,0.11917333801587422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,balanced,0.509605328241984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,balanced,0.1148373285929362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,balanced,0.5029333432515463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,balanced,0.12037332852681477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,balanced,0.5092800060907999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,balanced,0.12524799505869547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,balanced,0.5491360028584799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,balanced,0.1241919994354248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,balanced,0.507914662361145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,balanced,0.19920533895492554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,balanced,0.5013066530227661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,balanced,0.2837120095888774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,balanced,0.27190399169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,balanced,0.5184853474299113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,balanced,0.279423991839091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,balanced,0.2943360010782878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,balanced,0.4870719909667969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,balanced,0.29083200295766193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,balanced,0.056890666484832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,balanced,0.49696532885233563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,balanced,0.2976693312327067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,balanced,0.0543093333641688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,balanced,0.31568533182144165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,balanced,0.05710400144259135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,balanced,0.2919519941012065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,balanced,0.061717331409454346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,balanced,0.5013066530227661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,balanced,0.05982933441797892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,balanced,0.28885332743326825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,balanced,0.07394666473070781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,balanced,0.2847786744435628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,balanced,0.09029866258303325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,balanced,0.31031999985376996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,balanced,0.4862240155537923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,balanced,0.09083732962608337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.5048895835876465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,balanced,0.2999946673711141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,balanced,0.09168000022570293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,balanced,0.3139253258705139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,balanced,0.09192533294359843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.49225602149963377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,balanced,0.09326400359471639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,balanced,0.3169386585553487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,balanced,0.41866668065388996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.5010560035705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,balanced,0.09469333291053772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,balanced,0.34935466448465985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.36878080368041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,balanced,0.09526933232943217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,balanced,0.0962559978167216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,balanced,0.3724586566289266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.4140927791595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,balanced,0.10460799932479858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,balanced,0.9317279656728109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,balanced,0.10381866494814555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.4455872058868408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,balanced,0.3912959893544515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,balanced,0.10889066259066264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.29015040397644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.4517504215240479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,balanced,0.11763200163841248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.44133758544921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.2796736001968384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,balanced,0.40485866864522296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.29252479076385496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.4799359798431396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,balanced,0.8002453645070394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.201580810546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.5184512138366699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.459827184677124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,balanced,0.1276586651802063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.23978240489959718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.45484161376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,balanced,0.7126293182373047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.23987839221954346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.4522047996520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.2807487964630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.4860991954803467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.2834687948226929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,power_law_1.01,0.091839998960495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.47394561767578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.27647359371185304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,balanced,1.2821226914723713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,power_law_1.01,0.08436480164527893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.49580159187316897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.282092809677124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,balanced,0.14525333046913147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,power_law_1.01,0.08298879861831665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,balanced,0.7450933456420898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.2712127923965454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,power_law_1.01,0.07227519750595093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.44976000785827636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,balanced,0.16131732861200967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,power_law_1.01,0.08196480274200439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.2484544038772583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.38883199691772463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,power_law_1.01,0.08954880237579346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.2832063913345337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,power_law_1.01,0.09060479998588562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.546560001373291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,balanced,0.19151467084884644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,power_law_1.01,0.0885312020778656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.5812416076660156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.2781375885009766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,power_law_1.01,0.08926720023155213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,power_law_1.01,0.08659840226173401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.7724160194396973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.25956480503082274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,power_law_1.01,0.09377279877662659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,balanced,1.7051626841227214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,balanced,1.1157120068868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.2773184061050415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.01,1.0236607551574708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,power_law_1.01,0.09006720185279846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,power_law_1.01,0.10060800313949585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.2727231979370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.01,1.0645055770874023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,power_law_1.01,0.10471680164337158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.32179200649261475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.01,1.6012096405029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,power_law_1.01,0.11195520162582398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.3761728048324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,power_law_1.01,0.11784319877624512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.01,2.0389120101928713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,balanced,0.2249173323313395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.411846399307251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,power_law_1.01,0.13501440286636351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.01,2.8589311599731446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,power_law_1.01,0.17003519535064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.49836158752441406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.7356224060058594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.01,4.364736175537109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,balanced,0.2826666633288066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,1.0101951599121093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.01,0.1778175950050354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.01,4.752473449707031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,balanced,1.4415733019510906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,1.1477055549621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,1.8583808898925782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.01,7.903225708007812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.01,0.19095679521560668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,2.418911933898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.01,0.2129215955734253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,balanced,2.5075039863586426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.01,3.4333118438720702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.01,16.610214233398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.01,0.3142848014831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.01,5.297830581665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,balanced,0.36027733484903973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.01,0.34596478939056396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.511737585067749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.2861504077911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.01,0.532096004486084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.01,11.21942367553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.4951295852661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.27913599014282225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.46933760643005373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.01,0.6701183795928956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.2685247898101807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.3422784090042114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.2278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.01,1.0681535720825195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,balanced,0.4846026500066121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.34824318885803224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.21719040870666503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.01,1.34585599899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,balanced,2.1675732930501304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.4443840026855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.2729408025741577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,power_law_1.01,1.5768256187438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.4127039909362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.2500992059707642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.26387839317321776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.48129920959472655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.26483840942382814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.44802560806274416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.26672000885009767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.48003201484680175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,balanced,0.630016009012858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.281113600730896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,power_law_1.01,2.7396480560302736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.5051583766937255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.2674815893173218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.4960576057434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,power_law_1.01,5.76506233215332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.47521281242370605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.27209599018096925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.44727678298950196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.2507967948913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.4284224033355713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.2580287933349609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.48891520500183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.26000640392303465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.4012735843658447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.561734390258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.3083008050918579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,balanced,0.7827573617299398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.6050623893737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.33596799373626707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,balanced,4.53655465443929
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.6652863979339599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.41210241317749025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.8226240158081055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.5171520233154296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,1,128,power_law_1.2,1.408672046661377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.667903995513916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,1,128,power_law_1.2,1.6530111312866211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,1.0198464393615723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,1,128,power_law_1.2,2.075974464416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,1.2183168411254883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,1,128,power_law_1.2,2.9232831954956056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,1.883603286743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,2.5947967529296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,1,128,power_law_1.2,4.610003280639648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,3.6183807373046877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,balanced,4.046661376953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,1,128,power_law_1.2,7.205478668212891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,1,128,power_law_1.2,5.4804542541503904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,1,128,power_law_1.2,8.815174102783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,1,128,power_law_1.2,7.989369964599609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,balanced,1.2364479700724285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,1,128,power_law_1.2,15.626048278808593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,1,128,power_law_1.2,17.43761291503906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,1,128,power_law_1.2,41.995233154296876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,balanced,2.447807947794596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,balanced,0.1190720001856486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,1,128,power_law_1.2,0.0917631983757019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,balanced,0.11636799573898315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,balanced,0.12178666392962138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,1,128,power_law_1.2,0.08387200236320495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,balanced,0.12294933199882507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,1,128,power_law_1.2,0.08261119723320007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,balanced,0.20210667451222739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,1,128,power_law_1.2,0.07218559980392455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,balanced,0.36884268124898273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,1,128,power_law_1.2,0.07621759772300721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,balanced,0.5117813348770142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,1,128,power_law_1.2,0.08914560079574585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,balanced,0.5182613531748453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,1,128,power_law_1.2,0.081740802526474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,balanced,0.5200053453445435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,1,128,power_law_1.2,0.08833919763565064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,balanced,0.5187466541926066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,1,128,power_law_1.2,0.09151999950408936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,balanced,0.5061493317286173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,1,128,power_law_1.2,0.0869055986404419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,balanced,0.5027360121409098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,balanced,0.07796266674995422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,balanced,0.5320373376210531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,1,128,power_law_1.2,0.09148799777030944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,balanced,0.08142933249473572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,balanced,0.4970879952112834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,1,128,power_law_1.2,0.09253759980201721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,balanced,0.07972266773382823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,balanced,0.5208106835683187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,balanced,0.08120533327261607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,1,128,power_law_1.2,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,balanced,0.5084853172302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,balanced,0.13353600104649863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,1,128,power_law_1.2,0.10958720445632934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,balanced,0.21363733212153116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,balanced,0.5206079880396525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,balanced,0.29998934268951416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,1,128,power_law_1.2,0.11202559471130372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,balanced,0.49430398146311444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,balanced,0.29127466678619385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,1,128,power_law_1.2,0.12365440130233765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,balanced,0.30217599868774414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,balanced,0.527509331703186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,balanced,0.30103999376296997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,1,128,power_law_1.2,0.1478656053543091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,balanced,0.5593066612879435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,balanced,0.29889599482218426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,1,128,power_law_1.2,0.18439040184020997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,balanced,0.3086559971173604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,balanced,0.3078933358192444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,balanced,0.5172959963480631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,balanced,0.3140373428662618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,balanced,0.2943733334541321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.2,0.19352960586547852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,balanced,0.4991360108057658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,balanced,0.2988693316777547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,balanced,0.29153599341710407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,balanced,0.2942986687024434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.2,0.21341440677642823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,balanced,0.5038079818089803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.01,0.5261119842529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,balanced,0.3192533254623413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.2,0.25754880905151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.01,0.5080448150634765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,balanced,0.3332800070444743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.2,0.38757760524749757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.01,0.5322688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,balanced,0.04609066744645437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,balanced,0.447221318880717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,balanced,0.35683735211690265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.01,0.23155200481414795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,balanced,0.046853333711624146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.2,0.49356799125671386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,balanced,0.04677333434422811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,balanced,0.3872106472651164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.01,0.2840127944946289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,balanced,0.04882133503754934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.2,0.7064320087432862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,balanced,0.06047466893990835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.01,0.3905600070953369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,balanced,0.9549973011016846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.01,0.30556800365448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,balanced,0.40451733271280926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,balanced,0.07452799876530965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.01,0.3959680080413818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.2,0.9173439979553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.01,0.29513599872589114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,balanced,0.09044266740481059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.01,0.46707839965820314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.2,1.3215871810913087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.01,0.308409595489502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,balanced,0.09142933289210002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.01,0.4704063892364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,balanced,0.4247093200683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.01,0.13656320571899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.2,1.9792959213256835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,balanced,0.09142399827639262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.01,0.44328961372375486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.01,0.1711680054664612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,balanced,0.09215999643007915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,1,128,power_law_1.2,2.850489616394043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.01,0.443225622177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,balanced,0.8151413599650065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.01,0.22481279373168944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,balanced,0.09256533781687419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.01,0.4285696029663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,balanced,0.09494933485984802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.01,0.2382335901260376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,balanced,0.721664031346639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,1,128,power_law_1.2,4.045145416259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.01,0.44161281585693357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,balanced,0.0974666674931844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.01,0.2723968029022217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.01,0.25920639038085935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,1,128,power_law_1.2,7.888179016113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.01,0.4746880054473877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,balanced,0.09669333696365356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.01,0.26973440647125246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.01,0.46628479957580565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,balanced,0.10482133428255717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.01,0.25321600437164304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.01,0.5081600189208985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,balanced,0.7786186536153158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,power_law_1.01,0.09602559804916382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,balanced,0.10493333141009013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,balanced,1.3323360284169514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.01,0.25692799091339114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.01,0.43096318244934084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,power_law_1.01,0.0856383979320526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,balanced,0.11081066727638245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.01,0.2669375896453857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,power_law_1.01,0.08451840281486511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.01,0.42133121490478515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,balanced,0.1199733316898346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.01,0.27998719215393064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,power_law_1.01,0.061990398168563846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.01,0.541548776626587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.01,0.2549312114715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,power_law_1.01,0.06934400200843811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.01,0.6322944164276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.01,0.28787200450897216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,power_law_1.01,0.07608960270881653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,balanced,1.161072015762329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.01,0.6667712211608887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.01,0.28803839683532717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,power_law_1.01,0.07564799785614014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,balanced,0.13006933530171713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.01,0.8198911666870117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.01,0.27815680503845214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,power_law_1.01,0.08842880129814149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,balanced,1.7894293467203777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.01,0.30997118949890134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,power_law_1.01,0.08615679740905761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.01,0.9982080459594727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.01,0.32855679988861086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,power_law_1.01,0.08655999898910523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.01,1.3763839721679687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.01,0.3962048053741455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,power_law_1.01,0.09113600254058837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.01,1.59999361038208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.01,0.5462016105651856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,power_law_1.01,0.09392639994621277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.01,0.6531328201293946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.01,2.4349056243896485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,power_law_1.01,0.09520639777183533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,balanced,0.14991999665896097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,balanced,1.5138506889343262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,power_law_1.01,0.09717760086059571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.01,0.8809215545654296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,64,power_law_1.2,0.5205503940582276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.01,3.085580825805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,power_law_1.01,0.10864640474319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,balanced,0.16818133989969888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.01,1.0570943832397461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,64,power_law_1.2,0.5130496025085449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.01,3.793926239013672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,power_law_1.01,0.11397759914398194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,64,power_law_1.2,0.4597311973571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.01,1.6588159561157227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,64,power_law_1.2,0.1968384027481079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,power_law_1.01,0.12360960245132446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,balanced,0.19993066787719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.01,6.108319854736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.01,2.0630975723266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,64,power_law_1.2,0.2962752103805542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,power_law_1.01,0.14750720262527467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,64,power_law_1.2,0.31578879356384276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.01,2.526521682739258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,64,power_law_1.2,0.4207871913909912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.01,12.916581726074218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.01,3.9224193572998045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,64,power_law_1.2,0.45418238639831543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,balanced,2.640906651814779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,power_law_1.01,0.16309759616851807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,64,power_law_1.2,0.4179711818695068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.01,8.373689270019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,64,power_law_1.2,0.4244224071502686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,64,power_law_1.2,0.43206400871276857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,power_law_1.01,0.18791040182113647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,64,power_law_1.2,0.4817471981048584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,balanced,0.23798400163650513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,power_law_1.01,0.21673600673675536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,64,power_law_1.2,0.3654911994934082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,balanced,2.263045310974121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,64,power_law_1.2,0.456774377822876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,power_law_1.01,0.2965951919555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,64,power_law_1.2,0.4660352230072021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,balanced,0.30287466446558636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,64,power_law_1.2,0.42374401092529296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,64,power_law_1.2,0.46287999153137205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,power_law_1.01,0.36195199489593505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,64,power_law_1.2,0.5189760208129883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,power_law_1.01,0.5183296203613281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,64,power_law_1.2,0.5408383846282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,power_law_1.01,0.631987190246582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,balanced,0.3948800166447957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,64,power_law_1.2,0.6869247913360595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,64,power_law_1.2,0.8134079933166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,power_law_1.01,1.004857635498047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,64,power_law_1.2,0.9402239799499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,power_law_1.01,1.3040639877319335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,64,power_law_1.2,1.3225855827331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,64,power_law_1.2,1.7630720138549805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,balanced,0.5393493175506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,64,power_law_1.2,2.0893312454223634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,power_law_1.01,1.5132991790771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,64,power_law_1.2,3.7118785858154295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,64,power_law_1.2,5.179603195190429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,64,power_law_1.2,5.263302230834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,power_law_1.01,2.523423957824707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,64,power_law_1.2,9.291251373291015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,balanced,0.7232320308685303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,power_law_1.01,5.229043197631836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,balanced,4.629514694213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,64,power_law_1.2,21.948492431640624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,balanced,4.235530535380046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,balanced,0.8856426874796549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,balanced,1.3923892974853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,64,power_law_1.2,0.31525120735168455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,64,power_law_1.2,0.30030720233917235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,64,power_law_1.2,0.29367039203643797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,64,power_law_1.2,0.16202880144119264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,64,power_law_1.2,0.20206079483032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,64,power_law_1.2,0.19326080083847047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,64,power_law_1.2,0.19596799612045288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,64,power_law_1.2,0.2663680076599121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,64,power_law_1.2,0.28806400299072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,64,power_law_1.2,0.298905611038208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,64,power_law_1.2,0.2606656074523926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,64,power_law_1.2,0.2624063968658447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,64,power_law_1.2,0.26944000720977784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,64,power_law_1.2,0.2501503944396973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,64,power_law_1.2,0.27185280323028566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,64,power_law_1.2,0.2736063957214355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,64,power_law_1.2,0.26737279891967775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,64,power_law_1.2,0.29947519302368164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,64,power_law_1.2,0.3632128000259399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,64,power_law_1.2,0.38787839412689207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,64,power_law_1.2,0.475878381729126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,64,power_law_1.2,0.6688767910003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,64,power_law_1.2,0.7626239776611328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,64,power_law_1.2,1.1457152366638184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,64,power_law_1.2,1.4374400138854981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,64,power_law_1.2,2.037958335876465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,64,power_law_1.2,0.09541760087013244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,balanced,2.7137600580851235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,64,power_law_1.2,2.6596096038818358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,64,power_law_1.2,0.08470399975776673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,balanced,0.08308800061543782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,64,power_law_1.2,0.08363519906997681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,64,power_law_1.2,3.114521598815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,64,power_law_1.2,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,balanced,0.08141866823037465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,64,power_law_1.2,6.202016067504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,balanced,0.08264000217119853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,64,power_law_1.2,0.07462400197982788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,balanced,0.11194666226704915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,64,power_law_1.2,0.07432320117950439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,64,power_law_1.2,13.584474182128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,64,power_law_1.2,0.07406079769134521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,balanced,0.19273600975672403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,64,power_law_1.2,0.08170880079269409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,balanced,0.35605867703755695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,64,power_law_1.2,0.08279039859771728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,64,power_law_1.2,0.0840063989162445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,balanced,0.5397546688715616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,64,power_law_1.2,0.0880895972251892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,balanced,0.5221386750539144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,64,power_law_1.2,0.09105280041694641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,balanced,0.5179093281428019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,balanced,0.525871992111206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,64,power_law_1.2,0.09771519899368286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,balanced,0.5033493439356486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,64,power_law_1.2,0.1007807970046997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,balanced,0.5271999835968018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,64,power_law_1.2,0.10986239910125732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,balanced,0.5318826834360758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,64,power_law_1.2,0.1146496057510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,balanced,0.4918453296025594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,64,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,balanced,0.4793599843978882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,balanced,0.506437341372172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,64,power_law_1.2,0.1575744032859802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,balanced,0.5047626495361328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,balanced,0.4901866515477498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,64,power_law_1.2,0.18564480543136597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,balanced,0.5363893508911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,balanced,0.517525315284729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,64,power_law_1.2,0.2091968059539795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,balanced,0.5129599968592325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,64,power_law_1.2,0.23907840251922607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,64,power_law_1.2,0.3545664072036743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,balanced,0.06826133529345195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,balanced,0.5552693208058676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.01,0.2243648052215576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.01,0.3451904058456421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,balanced,0.07301866511503856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.01,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,balanced,0.08092266817887624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.01,0.5020287990570068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,balanced,0.5080533425013224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.01,0.32115199565887453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,64,power_law_1.2,0.44832639694213866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,balanced,0.12994666894276938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.01,0.511359977722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.01,0.11465599536895751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,balanced,0.21220266819000244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,64,power_law_1.2,0.6648447990417481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.01,0.15382399559020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,balanced,0.3108160098393758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.01,0.17861759662628174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.01,0.20885119438171387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,64,power_law_1.2,0.8611328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,balanced,0.3118079900741577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,balanced,0.4718506733576457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.01,0.23666560649871826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.01,0.22743680477142333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,balanced,0.3052159945170085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,balanced,0.0461760014295578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,64,power_law_1.2,1.4517951965332032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.01,0.33702399730682375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.01,0.2509119987487793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,balanced,0.32553066809972125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,balanced,0.04671466847260793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.01,0.24634881019592286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,64,power_law_1.2,1.870137596130371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.01,0.39599359035491943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,balanced,0.30271466573079425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.01,0.26184959411621095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,balanced,0.04689066608746847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.01,0.27631359100341796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.01,0.41303038597106934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,balanced,0.30931733051935834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,balanced,0.04967466493447622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,balanced,1.0196479956309001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.01,0.26282238960266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,64,power_law_1.2,2.1313472747802735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,balanced,0.062458669145902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,balanced,0.3065813382466634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.01,0.2815615892410278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.01,0.41484799385070803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,balanced,0.07613333563009898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,balanced,0.30144532521565753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.01,0.28051199913024905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,balanced,0.09373866518338521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,balanced,0.3070506652196248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,64,power_law_1.2,3.845926284790039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.01,0.44124798774719237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.01,0.2920128107070923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,balanced,0.09478400150934856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,balanced,0.3074079950650533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.01,0.2825023889541626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,balanced,0.0957973301410675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.01,0.3892672061920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,64,power_law_1.2,7.3805694580078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,balanced,0.3130720059076945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.01,0.2754816055297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,balanced,0.8840746879577637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,balanced,0.09613333145777385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.01,0.2712575912475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,balanced,0.0974133312702179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.01,0.482374382019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,balanced,0.3055306673049927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.01,0.3283391952514648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,balanced,0.09830933809280396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,balanced,0.3391093413035075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.01,0.37941761016845704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.01,0.4581183910369873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,balanced,0.10044800241788228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.01,0.4210048198699951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,balanced,0.32975999514261883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,balanced,0.1021066705385844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.01,0.43721599578857423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.01,0.5384575843811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,balanced,0.10935466488202412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.01,0.6571775913238526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,balanced,0.36025067170461017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.01,0.42344322204589846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,balanced,0.10961600144704182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,balanced,1.3938934008280437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.01,0.8068608283996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,balanced,0.11550399661064148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.01,0.49013118743896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.01,1.1165120124816894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,balanced,0.3910133441289266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.01,1.549779224395752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.01,0.4276864051818848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,balanced,0.12682132919629416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.01,2.066624069213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.01,0.45825920104980467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,balanced,0.4038453499476115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.01,2.4271615982055663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.01,0.4584512233734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.01,0.5233471870422364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.01,3.9726398468017576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.01,0.6889344215393066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,balanced,0.13944533467292786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,balanced,0.4530773162841797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.01,6.829708862304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.01,0.7266176223754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,balanced,1.9228746096293132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.01,0.9082367897033692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.01,1.2063936233520507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.01,1.393843173980713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,balanced,0.7991147041320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,balanced,0.16011200348536173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.01,2.021561622619629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.01,2.5033344268798827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,balanced,0.18123199542363486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.01,3.6582401275634764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,balanced,0.21935999393463135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,balanced,0.8384586970011393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.01,4.882521438598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.01,10.018208312988282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,balanced,2.823919932047526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,balanced,0.26551999648412067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,32,power_law_1.2,0.3652224063873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,balanced,1.2279893557230632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,32,power_law_1.2,0.495468807220459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,32,power_law_1.2,0.5311039924621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,balanced,0.3484586477279663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,32,power_law_1.2,0.18851200342178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,power_law_1.01,0.07807999849319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,32,power_law_1.2,0.28387200832366943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,32,power_law_1.2,0.276147198677063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,power_law_1.01,0.09139840006828308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,32,power_law_1.2,0.34746880531311036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,power_law_1.01,0.08810240030288696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,power_law_1.01,0.057126402854919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,balanced,1.6180906295776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,32,power_law_1.2,0.39404799938201907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,power_law_1.01,0.06823040246963501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,32,power_law_1.2,0.388371205329895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,balanced,0.47258134682973224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,power_law_1.01,0.07544320225715637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,32,power_law_1.2,0.41814398765563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,power_law_1.01,0.07847679853439331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,32,power_law_1.2,0.4340799808502197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,power_law_1.01,0.08039680123329163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,32,power_law_1.2,0.43016958236694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,power_law_1.01,0.08193920254707336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,32,power_law_1.2,0.44040961265563966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,power_law_1.01,0.0866815984249115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,32,power_law_1.2,0.4508863925933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,power_law_1.01,0.08625919818878174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,balanced,0.6497333447138468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,32,power_law_1.2,0.45067520141601564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,power_law_1.01,0.08983039855957031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,32,power_law_1.2,0.4601408004760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,power_law_1.01,0.09676160216331482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,32,power_law_1.2,0.4515391826629639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,power_law_1.01,0.1012992024421692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,32,power_law_1.2,0.488262414932251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,power_law_1.01,0.11400959491729737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,32,power_law_1.2,0.5155712127685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,power_law_1.01,0.11412479877471923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,32,power_law_1.2,0.6654079914093017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,power_law_1.01,0.12494080066680908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,balanced,2.4086559613545737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,balanced,5.0028533935546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,32,power_law_1.2,0.7371583938598633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,power_law_1.01,0.1492416024208069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,32,power_law_1.2,0.9174464225769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,balanced,0.8685812950134277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,32,power_law_1.2,1.069279956817627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,power_law_1.01,0.160806405544281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,32,power_law_1.2,1.6143999099731445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,32,power_law_1.2,1.741164779663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,power_law_1.01,0.19895039796829223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,power_law_1.01,0.23559679985046386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,32,power_law_1.2,2.4389888763427736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,power_law_1.01,0.3150079965591431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,32,power_law_1.2,3.0399423599243165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,32,power_law_1.2,4.57628173828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,balanced,1.0562293529510498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,power_law_1.01,0.3802880048751831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,32,power_law_1.2,7.35565414428711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,power_law_1.01,0.5477503776550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,32,power_law_1.2,12.553862762451171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,power_law_1.01,0.7403200149536133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,power_law_1.01,1.0787391662597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,power_law_1.01,1.3673855781555175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,power_law_1.01,1.8933504104614258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,32,power_law_1.2,0.21269760131835938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,32,power_law_1.2,0.29523839950561526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,32,power_law_1.2,0.2678656101226807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,power_law_1.01,2.8059520721435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,32,power_law_1.2,0.11125119924545288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,32,power_law_1.2,0.1442304015159607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,power_law_1.01,5.598425674438476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,balanced,4.572335879007976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,32,power_law_1.2,0.18292479515075682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,balanced,1.662757396697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,32,power_law_1.2,0.23242878913879395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,32,power_law_1.2,0.23946878910064698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,32,power_law_1.2,0.25708799362182616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,32,power_law_1.2,0.2595711946487427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,32,power_law_1.2,0.26881918907165525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,32,power_law_1.2,0.2554559946060181
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,32,power_law_1.2,0.2586688041687012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,32,power_law_1.2,0.24641919136047363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,32,power_law_1.2,0.27063679695129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,32,power_law_1.2,0.08247039914131164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,32,power_law_1.2,0.25645439624786376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,32,power_law_1.2,0.0917952001094818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,32,power_law_1.2,0.30001919269561766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,32,power_law_1.2,0.08818560242652893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,32,power_law_1.2,0.3202687978744507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,32,power_law_1.2,0.05729280114173889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,32,power_law_1.2,0.3189888000488281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,32,power_law_1.2,0.06616960167884826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,32,power_law_1.2,0.3946880102157593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,32,power_law_1.2,0.07354879975318909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,32,power_law_1.2,0.07790719866752624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,32,power_law_1.2,0.46613759994506837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,32,power_law_1.2,0.0824512004852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,32,power_law_1.2,0.6055679798126221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,32,power_law_1.2,0.08133760094642639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,32,power_law_1.2,0.7489855766296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,32,power_law_1.2,0.086080002784729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,32,power_law_1.2,1.0847743988037108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,balanced,0.055162668228149414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,32,power_law_1.2,0.08680959939956664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,32,power_law_1.2,1.1385727882385255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,32,power_law_1.2,0.09376000165939331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,balanced,0.05630933245023092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,32,power_law_1.2,1.823206329345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,32,power_law_1.2,0.09181439876556396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,balanced,0.05602133274078369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,32,power_law_1.2,0.10072319507598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,balanced,0.0637066662311554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,32,power_law_1.2,2.4686208724975587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,32,power_law_1.2,0.11217279434204101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,balanced,0.0774186650911967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,balanced,3.2425174713134766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,balanced,0.10866666833559673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,32,power_law_1.2,0.12336000204086303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,32,power_law_1.2,2.7047040939331053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,balanced,0.13617600003878275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,32,power_law_1.2,0.1337280035018921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,balanced,0.13954133788744608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,32,power_law_1.2,4.778323364257813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,32,power_law_1.2,0.1674880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,balanced,0.13684800267219543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,balanced,0.13948800166447958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,32,power_law_1.2,8.777561950683594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,balanced,0.14082133769989014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,32,power_law_1.2,0.1756991982460022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,balanced,0.1443839967250824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,balanced,0.14434666434923807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,32,power_law_1.2,0.19880959987640381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,32,power_law_1.2,0.25566720962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,balanced,0.14681067069371542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,32,power_law_1.2,0.400486421585083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,balanced,0.15261866648991904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,balanced,0.15477866927782694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,32,power_law_1.2,0.4555520057678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,balanced,0.15794666608174643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,32,power_law_1.2,0.6304512023925781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,balanced,0.170415997505188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,balanced,0.17861332496007284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,32,power_law_1.2,0.9761216163635253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,32,power_law_1.2,1.3421119689941405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,balanced,0.20058133204778036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,balanced,0.04864533245563507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,32,power_law_1.2,1.836639976501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,balanced,0.04967466493447622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,balanced,0.22282665967941284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,32,power_law_1.2,2.091212844848633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,balanced,0.04942933221658071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,balanced,0.2661706606547038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,balanced,0.05417066812515259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,32,power_law_1.2,4.204678344726562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,balanced,0.06362133224805196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,balanced,0.08170133332411449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,32,power_law_1.2,8.236377716064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,balanced,0.3028480013211568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,balanced,0.09759466846783955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,balanced,0.09910399715105693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,balanced,0.09927999973297119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,balanced,0.10044800241788228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,balanced,0.10366933544476827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,balanced,0.37854401270548504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,balanced,0.10520000259081523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,balanced,0.10643733541170756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,balanced,0.10855467120806377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,balanced,0.11593066652615865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,balanced,0.4645920197168986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,balanced,0.11840533216794331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,balanced,0.1258240044116974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,balanced,0.14101866881052652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,balanced,0.15465066830317178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,balanced,0.18066134055455527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,balanced,0.6248426834742228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,balanced,0.047797332207361855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,balanced,0.21204266945521036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,balanced,0.04854399959246317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,balanced,0.050288001696268715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,balanced,0.2654293378194173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,balanced,0.054010664423306785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,balanced,0.06815466781457265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,balanced,0.08090133468310039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,balanced,0.3131360014279683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,balanced,0.0997920036315918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,balanced,0.10136000315348308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,balanced,0.8151199817657471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,balanced,0.10219200452168782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.01,0.08621439933776856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,balanced,0.10265599687894185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,balanced,0.41898131370544434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,balanced,0.10474666953086853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.01,0.11141760349273681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,balanced,0.1062453289826711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.01,0.12498559951782226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.01,0.0750976026058197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,balanced,0.1086346705754598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.01,0.08760319948196411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,balanced,0.11091199517250061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.01,0.07875840067863464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,balanced,0.5267999966939291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,balanced,0.1186133325099945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.01,0.05910400152206421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.01,0.09221119880676269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,balanced,0.1195093293984731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.01,0.10586240291595458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.01,0.06395519971847534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.01,0.11054719686508178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,balanced,0.12762666742006937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,balanced,1.007210652033488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.01,0.11391999721527099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.01,0.0716543972492218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,balanced,0.14155733585357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.01,0.118995201587677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.01,0.07921280264854431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.01,0.1136512041091919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,balanced,0.7450239658355713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.01,0.13118720054626465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.01,0.08256000280380249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.01,0.12598400115966796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.01,0.08892800211906433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.01,0.13112319707870485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,balanced,0.15865066647529602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.01,0.08910719752311706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.01,0.137990403175354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.01,0.14422399997711183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.01,0.09344000220298768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.01,0.1437440037727356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.01,0.09745919704437256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.01,0.16591999530792237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.01,0.0949184000492096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.01,0.18089599609375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.01,0.10120320320129395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.01,0.21885440349578858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,balanced,0.9642346700032552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.01,0.11143679618835449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.01,0.250764799118042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,balanced,0.18786666790644327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.01,0.2918720006942749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.01,0.11523840427398682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.01,0.3885440111160278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,balanced,0.21700799465179443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.01,0.12410240173339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.01,0.49912319183349607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,balanced,1.470981280008952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.01,0.1412927985191345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.01,0.6034239768981934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,balanced,0.2725279927253723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.01,0.16531200408935548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.01,0.8273664474487304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.01,0.19527679681777954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.01,1.1712127685546876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.01,0.23313279151916505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.01,1.4253631591796876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.01,0.30439679622650145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,balanced,1.1837813059488933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.01,0.3573568105697632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.01,1.9578176498413087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.01,0.48157439231872556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.01,3.7166080474853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.01,0.6283775806427002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,balanced,0.3497866789499919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.01,0.8669119834899902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,16,power_law_1.2,0.08702719807624817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.01,1.1797696113586427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,balanced,0.4654773473739624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,16,power_law_1.2,0.10252159833908081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.01,1.435923194885254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,power_law_1.01,0.06908159852027893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,16,power_law_1.2,0.0862335979938507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.01,2.272684860229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,16,power_law_1.2,0.06993280053138733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,power_law_1.01,0.08150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,16,power_law_1.2,0.07637760043144226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,power_law_1.01,0.09775999784469605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,balanced,0.6400959889094034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,16,power_law_1.2,0.0864575982093811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.01,4.653619384765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,power_law_1.01,0.0606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,16,power_law_1.2,0.09567999839782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,power_law_1.01,0.06807039976119995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,16,power_law_1.2,0.1089792013168335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,balanced,1.8284692764282227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,power_law_1.01,0.0773248016834259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,16,power_law_1.2,0.11469440460205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,power_law_1.01,0.07846400141716003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,16,power_law_1.2,0.11430399417877198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,power_law_1.01,0.08730239868164062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,balanced,0.8794933160146078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,power_law_1.01,0.08811519742012024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,16,power_law_1.2,0.11860480308532714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,power_law_1.01,0.09304959774017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,16,power_law_1.2,0.12252800464630127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,power_law_1.01,0.09434239864349366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,16,power_law_1.2,0.12290560007095337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,power_law_1.01,0.10122879743576049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,power_law_1.01,0.10242559909820556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,16,power_law_1.2,0.1327232003211975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,power_law_1.01,0.1119871973991394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,16,power_law_1.2,0.14123519659042358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,power_law_1.01,0.12197120189666748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,balanced,2.7874345779418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,power_law_1.01,0.1221824049949646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,16,power_law_1.2,0.1438912034034729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,power_law_1.01,0.14046080112457277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,balanced,1.1630773544311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,16,power_law_1.2,0.14962559938430786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,power_law_1.01,0.17279360294342042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,16,power_law_1.2,0.17524479627609252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,16,power_law_1.2,0.06775040030479432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,16,power_law_1.2,0.18845440149307252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,power_law_1.01,0.18676480054855346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,16,power_law_1.2,0.2348031997680664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,16,power_law_1.2,0.07861760258674622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,16,power_law_1.2,0.26576640605926516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,16,power_law_1.2,0.0711296021938324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,power_law_1.01,0.23313920497894286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,16,power_law_1.2,0.325548791885376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,16,power_law_1.2,0.0581055998802185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,power_law_1.01,0.27746560573577883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,16,power_law_1.2,0.40695037841796877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,16,power_law_1.2,0.060159999132156375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,power_law_1.01,0.41641597747802733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,balanced,1.4255785942077637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,16,power_law_1.2,0.5849919795989991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,16,power_law_1.2,0.07081599831581116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,16,power_law_1.2,0.6829440116882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,16,power_law_1.2,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,power_law_1.01,0.47037439346313475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,16,power_law_1.2,0.906214427947998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,16,power_law_1.2,0.08254079818725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,power_law_1.01,0.6397247791290284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,16,power_law_1.2,1.2483967781066894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,16,power_law_1.2,0.0835968017578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,power_law_1.01,0.8298368453979492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,16,power_law_1.2,1.6013696670532227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,16,power_law_1.2,0.08707839846611024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,power_law_1.01,1.2296128273010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,balanced,3.572688102722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,16,power_law_1.2,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,16,power_law_1.2,2.4060031890869142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,power_law_1.01,1.6576831817626954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,16,power_law_1.2,0.09455999732017517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,16,power_law_1.2,0.09502720236778259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,16,power_law_1.2,4.513907241821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,power_law_1.01,2.009369659423828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,16,power_law_1.2,0.10325119495391846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,power_law_1.01,3.3976192474365234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,16,power_law_1.2,0.11233919858932495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,16,power_law_1.2,0.11299200057983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,power_law_1.01,6.609657287597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,16,power_law_1.2,0.1248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,balanced,2.2329227129618325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,16,power_law_1.2,0.14565759897232056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,16,power_law_1.2,0.16696959733963013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,16,power_law_1.2,0.20449280738830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,16,power_law_1.2,0.24398720264434814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,16,power_law_1.2,0.32311038970947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,16,power_law_1.2,0.37839999198913576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,16,power_law_1.2,0.506009578704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,16,power_law_1.2,0.6661439895629883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,16,power_law_1.2,0.9812288284301758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,16,power_law_1.2,1.3913663864135741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,16,power_law_1.2,1.5421952247619628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,16,power_law_1.2,2.4504831314086912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,16,power_law_1.2,5.350009536743164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,balanced,4.381002744038899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,16,power_law_1.2,0.06884480118751526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,16,power_law_1.2,0.08167679905891419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,balanced,0.05628266433874766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,16,power_law_1.2,0.0687936007976532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,balanced,0.05585066477457682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,balanced,0.057071998715400696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,16,power_law_1.2,0.06069759726524353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,balanced,0.06725866595904033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,16,power_law_1.2,0.06501759886741638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,balanced,0.07903466622034709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,16,power_law_1.2,0.0730239987373352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,balanced,0.11171199878056844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,balanced,0.14223466316858926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,16,power_law_1.2,0.07687039971351624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,balanced,0.14379733800888062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,balanced,0.04888000090916952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,16,power_law_1.2,0.08674560189247131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,balanced,0.14285866419474283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,balanced,0.1460693379243215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,16,power_law_1.2,0.08469120264053345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,balanced,0.0491839994986852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,balanced,0.14628266294797262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,balanced,0.050842667619387306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,16,power_law_1.2,0.09207040071487427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,balanced,0.1504639983177185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,balanced,0.05629866818586985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,16,power_law_1.2,0.09257599711418152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,balanced,0.15130666891733804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,balanced,0.06559466818968455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,balanced,0.1543839971224467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,16,power_law_1.2,0.09748479723930359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,balanced,0.16044800480206808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,balanced,0.09007466832796733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,16,power_law_1.2,0.1035647988319397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,balanced,0.1655786633491516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,balanced,0.11037866274515788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,16,power_law_1.2,0.10885759592056274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,balanced,0.17019732793172201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,balanced,0.10959466298421223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,16,power_law_1.2,0.1207808017730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,balanced,0.11044266819953918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,balanced,0.18705066045125326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,balanced,0.11242666840553284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,16,power_law_1.2,0.12666879892349242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,balanced,0.1997119983037313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,balanced,0.11367467045783997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,balanced,0.22900267442067465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,16,power_law_1.2,0.14773759841918946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,balanced,0.11539733409881592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,balanced,0.11821867028872173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,balanced,0.255023996035258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,16,power_law_1.2,0.1770624041557312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,balanced,0.11906133095423381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,balanced,0.12929600477218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,balanced,0.30499200026194256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,balanced,0.13193066914876303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,16,power_law_1.2,0.19661439657211305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,balanced,0.14028799533843994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,balanced,0.3643093506495158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,balanced,0.1565600037574768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,16,power_law_1.2,0.2280128002166748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,balanced,0.17351466417312622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,balanced,0.4844213326772054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,16,power_law_1.2,0.287827205657959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.01,0.06700800061225891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,balanced,0.208021342754364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,16,power_law_1.2,0.4329216003417969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.01,0.08432639837265014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,balanced,0.24193066358566284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.01,0.1118399977684021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.01,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,balanced,0.5935786565144857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,16,power_law_1.2,0.49767680168151857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.01,0.0770687997341156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,balanced,0.30027733246485394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,balanced,0.05190933247407278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.01,0.09297279715538025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,16,power_law_1.2,0.7835519790649415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.01,0.09415040016174317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,balanced,0.05486399928728739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.01,0.11654399633407593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,16,power_law_1.2,1.0465215682983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,balanced,0.05719999969005585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,balanced,0.36869335174560547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.01,0.1184000015258789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.01,0.05482239723205566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,balanced,0.06337066491444905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.01,0.12588800191879274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,16,power_law_1.2,1.409785556793213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,balanced,0.07409066458543141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.01,0.0665727972984314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,balanced,0.8324213027954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.01,0.12526079416275024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,balanced,0.09493333101272583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,16,power_law_1.2,2.14401912689209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,balanced,0.5080853303273519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.01,0.1233024001121521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.01,0.08076800107955932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,balanced,0.11596266428629558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.01,0.1293887972831726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,16,power_law_1.2,2.6057472229003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,balanced,0.11806933085123698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.01,0.058406400680541995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.01,0.13497600555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,balanced,0.11917866269747417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.01,0.1522879958152771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.01,0.06480640172958374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,16,power_law_1.2,3.7189823150634767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,balanced,0.12131200234095256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.01,0.15345920324325563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,balanced,0.6424640019734701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.01,0.16643840074539185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,balanced,0.12223999698956807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.01,0.07268480062484742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.01,0.18290560245513915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,balanced,0.12577600280443826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,16,power_law_1.2,8.41502685546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.01,0.08149759769439698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.01,0.20346240997314452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,balanced,1.06660262743632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,balanced,0.12909866372744241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.01,0.24563839435577392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.01,0.08877440094947815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,balanced,0.13214932878812155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.01,0.2752959966659546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.01,0.0923520028591156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,balanced,0.1421173314253489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.01,0.33841919898986816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,balanced,0.14432533582051596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.01,0.09416319727897644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.01,0.4086912155151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,balanced,0.9194293022155762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.01,0.5419712066650391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,balanced,0.15711466471354166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.01,0.09994879961013795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.01,0.7115968227386474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,balanced,0.17409066359202066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.01,0.10290559530258178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,power_law_1.01,0.0649728000164032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.01,0.9659711837768554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.01,0.10671360492706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.01,1.2207936286926269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,power_law_1.01,0.07561600208282471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,balanced,1.2716373602549236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,power_law_1.01,0.09652479887008666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.01,0.11311999559402466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.01,1.5601984024047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,power_law_1.01,0.06843519806861878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.01,0.12263679504394531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,balanced,0.19991467396418253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,balanced,1.1772533257802327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.01,2.4794687271118163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,power_law_1.01,0.07640960216522216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.01,0.12910720109939575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,power_law_1.01,0.08463360071182251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.01,0.1419327974319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,8,power_law_1.2,0.06737279891967773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.01,4.760121536254883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,power_law_1.01,0.09257599711418152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.01,0.16764800548553466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,power_law_1.01,0.10168319940567017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,8,power_law_1.2,0.08452479839324951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.01,0.17968000173568727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,power_law_1.01,0.10430719852447509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.01,0.22407679557800292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,8,power_law_1.2,0.0809216022491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,power_law_1.01,0.10740480422973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,balanced,0.26203733682632446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.01,0.2515968084335327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,power_law_1.01,0.11088639497756958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,8,power_law_1.2,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.01,0.3404416084289551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,balanced,0.31825600067774457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,power_law_1.01,0.11611520051956177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,8,power_law_1.2,0.07672960162162781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.01,0.40943360328674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,power_law_1.01,0.12074240446090698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,balanced,1.446181297302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,8,power_law_1.2,0.0834879994392395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,balanced,0.40004801750183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.01,0.5357120037078857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,power_law_1.01,0.13151999711990356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,8,power_law_1.2,0.09260799884796142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,balanced,1.943050702412923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.01,0.7310527801513672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,power_law_1.01,0.14535679817199706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,balanced,0.5163466533025106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,8,power_law_1.2,0.1071936011314392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.01,1.023033618927002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,power_law_1.01,0.15234559774398804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,power_law_1.01,0.17052799463272095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,8,power_law_1.2,0.11137280464172364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.01,1.3221759796142578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.01,1.6481920242309571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,8,power_law_1.2,0.11667200326919555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,power_law_1.01,0.21206400394439698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,balanced,0.6875200271606445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,8,power_law_1.2,0.12208000421524048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.01,2.5476543426513674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,8,power_law_1.2,0.12366080284118652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,power_law_1.01,0.23838720321655274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.01,5.273510360717774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,8,power_law_1.2,0.13112319707870485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,balanced,0.9388853708902994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,8,power_law_1.2,0.1425536036491394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,power_law_1.01,0.3060287952423096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,8,power_law_1.2,0.1548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,power_law_1.01,0.37798399925231935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,8,power_law_1.2,0.15783679485321045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,balanced,2.2498292922973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,power_law_1.01,0.5208127975463868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,8,power_law_1.2,0.16314239501953126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,power_law_1.01,0.651801586151123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,8,power_law_1.2,0.18492159843444825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,balanced,1.2913866837819417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,power_law_1.01,0.8871616363525391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,8,power_law_1.2,0.20671360492706298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,power_law_1.01,1.1344127655029297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,8,power_law_1.2,0.24897921085357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,power_law_1.01,1.741868782043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,8,power_law_1.2,0.284006404876709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,power_law_1.01,2.2065216064453126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,8,power_law_1.2,0.36953599452972413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,power_law_1.01,2.7758655548095703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,balanced,1.7347092628479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,8,power_law_1.2,0.44434561729431155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,power_law_1.01,4.496217727661133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,8,power_law_1.2,0.5683199882507324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,8,power_law_1.2,0.798521614074707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,power_law_1.01,8.508460998535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,balanced,3.809098561604818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,8,power_law_1.2,1.041823959350586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,8,power_law_1.2,1.4390912055969238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,8,power_law_1.2,1.7582399368286132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,balanced,2.148746649424235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,8,power_law_1.2,3.0391616821289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,8,power_law_1.2,6.684012603759766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,balanced,4.422197341918945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,balanced,3.3605705897013345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,8,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,8,power_law_1.2,0.06641280055046081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,8,power_law_1.2,0.05928959846496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,8,power_law_1.2,0.05904639959335327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,8,power_law_1.2,0.06421120166778564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,8,power_law_1.2,0.06934400200843811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,8,power_law_1.2,0.07793279886245727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,8,power_law_1.2,0.08810880184173583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,8,power_law_1.2,0.0913536012172699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,8,power_law_1.2,0.09304959774017334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,8,power_law_1.2,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,8,power_law_1.2,0.10268160104751586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,8,power_law_1.2,0.10537600517272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,8,power_law_1.2,0.11395200490951538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,8,power_law_1.2,0.06433280110359192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,8,power_law_1.2,0.12332799434661865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,8,power_law_1.2,0.13226879835128785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,balanced,6.602415720621745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,8,power_law_1.2,0.07548800110816956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,8,power_law_1.2,0.14534399509429932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,8,power_law_1.2,0.06963840126991272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,8,power_law_1.2,0.17464319467544556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,8,power_law_1.2,0.18392319679260255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,8,power_law_1.2,0.06743040084838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,8,power_law_1.2,0.23569920063018798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,8,power_law_1.2,0.07255039811134338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,8,power_law_1.2,0.2690943956375122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,8,power_law_1.2,0.08311039805412293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,8,power_law_1.2,0.3406847953796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,8,power_law_1.2,0.08803200125694274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,8,power_law_1.2,0.4413760185241699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,8,power_law_1.2,0.09820799827575684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,8,power_law_1.2,0.10396159887313842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,8,power_law_1.2,0.6333439826965332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,balanced,0.05657066901524862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,8,power_law_1.2,0.10442240238189697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,8,power_law_1.2,0.7883071899414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,balanced,0.05805333455403646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,balanced,0.05968533456325531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,8,power_law_1.2,0.1087231993675232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,8,power_law_1.2,1.240332794189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,balanced,0.08546132842699687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,8,power_law_1.2,0.11661440134048462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,balanced,0.09797867139180501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,8,power_law_1.2,1.4218111991882325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,8,power_law_1.2,0.12140159606933594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,balanced,0.1295840044816335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,8,power_law_1.2,1.7491840362548827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,balanced,0.16100266575813293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,8,power_law_1.2,0.13178240060806273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,balanced,0.1550879975159963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,8,power_law_1.2,0.14550399780273438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,8,power_law_1.2,2.9511104583740235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,balanced,0.1548746625582377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,8,power_law_1.2,0.1534783959388733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,balanced,0.1585706671079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,8,power_law_1.2,0.1788480043411255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,8,power_law_1.2,6.172415924072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,balanced,0.15738133589426676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,balanced,0.16127467155456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,8,power_law_1.2,0.2137279987335205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,balanced,0.1648319959640503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,balanced,0.1670773426691691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,balanced,0.17638399203618368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,8,power_law_1.2,0.26116480827331545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,balanced,0.18101332585016885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,balanced,0.18631466229756674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,8,power_law_1.2,0.3192255973815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,balanced,0.20851200819015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,8,power_law_1.2,0.4207168102264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,balanced,0.22417600949605307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,8,power_law_1.2,0.5335807800292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,balanced,0.05041599770387014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,8,power_law_1.2,0.7152639865875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,balanced,0.262773334980011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,balanced,0.052111998200416565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,8,power_law_1.2,0.969753646850586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,balanced,0.05500266452630361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,balanced,0.3268959919611613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,balanced,0.06147199869155884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,8,power_law_1.2,1.4036160469055177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,balanced,0.0814879983663559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,balanced,0.11241599917411804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,balanced,0.4099946816762288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,8,power_law_1.2,2.0175743103027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,balanced,0.14113066593805948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,8,power_law_1.2,2.566649627685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,balanced,0.13865066568056741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,balanced,0.1404906709988912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,balanced,0.5017386674880981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,8,power_law_1.2,3.2515838623046873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,balanced,0.14249599973360697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,balanced,0.1436906655629476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,balanced,0.14865600069363913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,8,power_law_1.2,5.114547348022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.01,0.05930240154266357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.01,0.053260797262191774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,balanced,0.15078933040301004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,balanced,0.6995786825815836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,balanced,0.151829332113266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.01,0.07896320223808288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.01,0.06060799956321716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,8,power_law_1.2,10.219654083251953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,balanced,0.1642400026321411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.01,0.088646399974823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.01,0.07571200132369996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,balanced,0.16410133242607117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.01,0.07599999904632568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,balanced,0.1743519902229309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.01,0.06487039923667907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.01,0.08810880184173583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,balanced,0.8731040159861246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,balanced,0.1930239995320638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.01,0.10173439979553223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.01,0.07605119943618774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,balanced,0.21963733434677124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.01,0.11259520053863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.01,0.08850560188293458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,balanced,0.2645866672197978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.01,0.12420480251312256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.01,0.12888959646224976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.01,0.09675520062446594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,balanced,0.3126453359921773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.01,0.1338495969772339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,balanced,1.2510933081309001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.01,0.1131327986717224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.01,0.1377087950706482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,balanced,0.39339200655619305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.01,0.11547520160675048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.01,0.14335999488830567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.01,0.11915520429611207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.01,0.14658559560775758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.01,0.12388479709625244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,balanced,0.49590933322906494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.01,0.15605759620666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.01,0.12963839769363403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.01,0.16684160232543946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.01,0.13701119422912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.01,0.17271039485931397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.01,0.14175360202789306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,balanced,0.7019946575164795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,balanced,1.5543626149495442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.01,0.1873792052268982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.01,0.15319039821624755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.01,0.21760001182556152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.01,0.1615231990814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.01,1.4355775833129882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.01,0.16811519861221313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.01,1.4865535736083983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.01,0.20941441059112548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,balanced,0.892789363861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.01,0.23646080493927002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.01,0.3435647964477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.01,0.2981247901916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.01,0.4187903881072998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.01,0.3299520015716553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.01,0.5647103786468506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.01,0.4136767864227295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.01,0.7390719890594483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.01,0.5425983905792237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,balanced,1.8930346171061199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.01,0.9299967765808106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,balanced,1.3011093139648438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.01,0.7440576076507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.01,1.4069888114929199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.01,0.9174336433410645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.01,1.7227455139160157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.01,1.3733887672424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.01,2.1185279846191407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.01,1.7520832061767577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.01,3.1321792602539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.01,2.152204895019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.01,6.9940544128417965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.01,3.464467239379883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,balanced,1.6376105944315593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.01,6.97790756225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,balanced,2.9460318883260093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,balanced,2.035989284515381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,balanced,3.1587626139322915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,4,power_law_1.2,0.05928959846496582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,4,power_law_1.2,0.07917439937591553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,4,power_law_1.2,0.06824960112571717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,4,power_law_1.2,0.07341439723968506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,4,power_law_1.2,0.08453119993209839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,4,power_law_1.2,0.0995136022567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,4,power_law_1.2,0.10683519840240478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,4,power_law_1.2,0.1198464035987854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,4,power_law_1.2,0.12776319980621337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,4,power_law_1.2,0.13484159708023072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,balanced,5.703114827473958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,4,power_law_1.2,0.14022400379180908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,4,power_law_1.2,0.14149119853973388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,4,power_law_1.2,0.1473855972290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,4,power_law_1.2,0.1561535954475403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,4,power_law_1.2,0.16663680076599122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,4,power_law_1.2,0.17556480169296265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,4,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,4,power_law_1.2,0.18967679738998414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,4,power_law_1.2,0.0606719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,4,power_law_1.2,0.22070400714874266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,4,power_law_1.2,0.061363202333450315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,4,power_law_1.2,1.4475071907043457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,4,power_law_1.2,1.5052736282348633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,4,power_law_1.2,0.06317440271377564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,4,power_law_1.2,0.34707839488983155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,4,power_law_1.2,0.07428479790687562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,4,power_law_1.2,0.4484288215637207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,4,power_law_1.2,0.5607232093811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,4,power_law_1.2,0.08367999792098998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,4,power_law_1.2,0.7618175983428955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,4,power_law_1.2,0.08852480053901672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,4,power_law_1.2,0.9474559783935547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,4,power_law_1.2,0.11012480258941651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,4,power_law_1.2,1.3917311668395995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,balanced,6.328421274820964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,4,power_law_1.2,0.11302399635314941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,4,power_law_1.2,2.0298303604125976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,4,power_law_1.2,0.11632640361785888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,4,power_law_1.2,2.2955648422241213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,4,power_law_1.2,0.11998080015182495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,4,power_law_1.2,0.12361600399017333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,4,power_law_1.2,3.456300735473633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,4,power_law_1.2,0.13199360370635987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,4,power_law_1.2,0.14209280014038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,4,power_law_1.2,7.137760162353516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,4,power_law_1.2,0.15576319694519042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,4,power_law_1.2,0.16575360298156738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,4,power_law_1.2,0.17783679962158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,4,power_law_1.2,0.21152639389038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,4,power_law_1.2,0.2460927963256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,4,power_law_1.2,0.29789440631866454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,4,power_law_1.2,0.34669439792633056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,4,power_law_1.2,0.43528318405151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,4,power_law_1.2,0.5748799800872803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,4,power_law_1.2,0.7830143928527832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,4,power_law_1.2,0.9991040229797363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,4,power_law_1.2,1.4567423820495606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,4,power_law_1.2,1.8987327575683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,balanced,0.052149335543314614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,4,power_law_1.2,2.218662452697754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,power_law_1.01,0.05115519762039185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,balanced,0.05310933291912079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,balanced,0.05339199801286062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,4,power_law_1.2,3.7935039520263674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,balanced,0.05971199770768484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,power_law_1.01,0.05137919783592224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,balanced,0.07119999825954437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,4,power_law_1.2,8.152838134765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,power_law_1.01,0.05671039819717407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,balanced,0.0872373382250468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,power_law_1.01,0.06023039817810059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,balanced,0.07805866499741872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,power_law_1.01,0.07234560251235962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,balanced,0.07909333209196727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,power_law_1.01,0.07384960055351257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,balanced,0.09313600262006123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,power_law_1.01,0.07159680128097534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,balanced,0.09236799677213033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,balanced,0.09564266602198283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,power_law_1.01,0.08394880294799804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,balanced,0.08571199576059978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,power_law_1.01,0.08410239815711976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,balanced,0.08745599786440532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,power_law_1.01,0.08461440205574036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,balanced,0.08736532926559448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,1,128,power_law_1.2,0.05189759731292724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,power_law_1.01,0.08480640053749085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,balanced,0.08779199918111165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,1,128,power_law_1.2,0.052928000688552856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,power_law_1.01,0.08652160167694092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,balanced,0.08948266506195068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,1,128,power_law_1.2,0.052083200216293334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,power_law_1.01,0.08600320219993592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,balanced,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,1,128,power_law_1.2,0.0567359983921051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,balanced,0.09330667058626811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,power_law_1.01,0.08844159841537476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,1,128,power_law_1.2,0.06105599999427795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,balanced,0.09859733780225118
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,power_law_1.01,0.09066879749298096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,1,128,power_law_1.2,0.07181439995765686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,power_law_1.01,0.09563519954681396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,balanced,0.10521599650382996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,power_law_1.01,0.10274560451507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,1,128,power_law_1.2,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,balanced,0.11421866218249004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,power_law_1.01,0.128057599067688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,1,128,power_law_1.2,0.07200000286102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,balanced,0.12968533237775168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,power_law_1.01,0.14897279739379882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,1,128,power_law_1.2,0.08444160223007202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,power_law_1.01,0.20439679622650148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,1,128,power_law_1.2,0.08469120264053345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,balanced,0.14916266997655234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,balanced,0.04584533472855886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,power_law_1.01,0.2445823907852173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,1,128,power_law_1.2,0.08506879806518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,balanced,0.046906664967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,power_law_1.01,0.3728960037231445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,1,128,power_law_1.2,0.08525440096855164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,balanced,0.19642666975657144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,balanced,0.04752533137798309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,1,128,power_law_1.2,0.0858560025691986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,power_law_1.01,0.4439040184020996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,balanced,0.04730133215586344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,1,128,power_law_1.2,0.08712319731712341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,power_law_1.01,0.739743995666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,balanced,0.23466134071350098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,balanced,0.052095999320348106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,power_law_1.01,0.9379520416259766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,1,128,power_law_1.2,0.0869376003742218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,balanced,0.05972266693909963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,1,128,power_law_1.2,0.0878271996974945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,power_law_1.01,1.2148032188415527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,balanced,0.06693866848945618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,balanced,0.3325279951095581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,1,128,power_law_1.2,0.09308800101280212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,balanced,0.06855466465155284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,power_law_1.01,1.8203519821166991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,balanced,0.07366399963696797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,1,128,power_law_1.2,0.10510720014572143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,power_law_1.01,4.018815994262695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,balanced,0.07376533250013988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,1,128,power_law_1.2,0.121343994140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,balanced,0.0720960001150767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,1,128,power_law_1.2,0.1428928017616272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,balanced,0.43245331446329754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,balanced,0.06903466582298279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,1,128,power_law_1.2,0.17455999851226806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,balanced,0.07107200225194295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,1,128,power_law_1.2,0.25583999156951903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,power_law_1.01,0.053855997323989865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,balanced,0.07031466563542683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,balanced,0.07082133491834004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,power_law_1.01,0.04899199903011322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,1,128,power_law_1.2,0.34878079891204833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,balanced,0.07170133292675018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,balanced,0.5351839860280355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,1,128,power_law_1.2,0.5528895854949951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,power_law_1.01,0.04807040095329285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,balanced,0.07257600128650665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,power_law_1.01,0.051769602298736575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,1,128,power_law_1.2,0.7121984004974365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,balanced,0.07699200014273326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,power_law_1.01,0.0595583975315094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,64,power_law_1.2,0.05248640179634094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,1,128,power_law_1.2,1.1234623908996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,power_law_1.01,0.06332160234451294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,balanced,0.07965333263079326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,64,power_law_1.2,0.04745599925518036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,1,128,power_law_1.2,1.4457792282104491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,power_law_1.01,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,balanced,0.08890666564305623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,64,power_law_1.2,0.04581120014190674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,power_law_1.01,0.06813439726829529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,1,128,power_law_1.2,1.6924736022949218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,64,power_law_1.2,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,balanced,0.0974133312702179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,power_law_1.01,0.06824319958686828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,64,power_law_1.2,0.05109120011329651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,balanced,0.841877301534017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,1,128,power_law_1.2,3.589446258544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,power_law_1.01,0.06813439726829529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,64,power_law_1.2,0.05667200088500977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,balanced,0.11281599601109822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,64,power_law_1.2,0.0632960021495819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,power_law_1.2,6.041567993164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,power_law_1.01,0.06863999962806702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,64,power_law_1.2,0.0641152024269104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,balanced,0.12871467073758444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,power_law_1.01,0.06937599778175355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,64,power_law_1.2,0.06747519969940186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,power_law_1.01,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,64,power_law_1.2,0.06801279783248901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,balanced,0.1781066656112671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,power_law_1.01,0.0725823998451233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,64,power_law_1.2,0.06828799843788147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,power_law_1.01,0.07055360078811646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,64,power_law_1.2,0.06992639899253845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,power_law_1.01,0.07483519911766053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,balanced,0.21709332863489786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,64,power_law_1.2,0.07088639736175537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,power_law_1.01,0.07899519801139832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,64,power_law_1.2,0.07180160284042358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,power_law_1.01,0.08268799781799316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,64,power_law_1.2,0.0716480016708374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,power_law_1.01,0.10094720125198364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,balanced,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,64,power_law_1.2,0.06996480226516724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,balanced,0.3149706721305847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,64,power_law_1.2,0.07452800273895263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,power_law_1.01,0.11003520488739013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,balanced,0.03484266748030981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,balanced,0.03517866631348928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,1,128,balanced,1.6598560015360515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,64,power_law_1.2,0.08144000172615051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,power_law_1.01,0.1591871976852417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,balanced,0.037802666425704956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,64,power_law_1.2,0.085971200466156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,power_law_1.01,0.2110975980758667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,balanced,0.043509334325790405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,balanced,0.40831466515858966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,balanced,0.04641066491603851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,64,power_law_1.2,0.1172287940979004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,power_law_1.01,0.2798527956008911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,64,power_law_1.2,0.14187519550323485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,balanced,0.04959466556708018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,power_law_1.01,0.35946240425109866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,64,power_law_1.2,0.2211967945098877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,power_law_1.01,0.03586559891700745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,balanced,0.05318933228651682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,power_law_1.01,0.5352128028869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,64,power_law_1.2,0.2486016035079956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,balanced,0.06243733565012614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,power_law_1.01,0.7516096115112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,power_law_1.01,0.03676159977912903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,64,power_law_1.2,0.32312960624694825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,balanced,0.06284266710281372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,balanced,0.5031786759694418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,64,power_law_1.2,0.4901951789855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,power_law_1.01,1.0530752182006835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,power_law_1.01,0.035436800122261046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,balanced,0.05985066791375478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,64,power_law_1.2,0.7965119838714599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,power_law_1.01,1.548755168914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,power_law_1.01,0.039552000164985654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,64,power_law_1.2,0.9824128150939941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,balanced,0.05862933397293091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,power_law_1.01,2.77960319519043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,power_law_1.01,0.04217599928379059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,64,power_law_1.2,1.37139835357666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,balanced,0.06242666641871134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,power_law_1.01,0.045433598756790164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,balanced,0.06176533301671346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,power_law_1.2,2.1540224075317385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,power_law_1.01,0.04888960123062134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,balanced,0.06253333389759064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,power_law_1.2,4.7888641357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,power_law_1.01,0.051846402883529666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,balanced,0.06353066861629486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,64,balanced,0.7877653439839681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,power_law_1.01,0.061459201574325564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,balanced,0.06369066735108693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,power_law_1.01,0.06296319961547851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,balanced,0.06736533343791962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,power_law_1.01,0.06130560040473938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,balanced,0.07082133491834004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,power_law_1.01,0.05927680134773254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,balanced,0.08105599880218506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,power_law_1.01,0.0609279990196228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,balanced,0.09032000104586284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,power_law_1.01,0.06505600214004517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,power_law_1.01,0.06577280163764954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,balanced,0.10858666896820068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,power_law_1.01,0.06455039978027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,balanced,0.12703999876976013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,power_law_1.01,0.06920959949493408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,power_law_1.01,0.07082880139350892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,balanced,0.17360534270604452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,power_law_1.01,0.07774720191955567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,64,balanced,1.552853266398112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,power_law_1.01,0.09464960098266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,balanced,0.21137599150339761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,power_law_1.01,0.10396800041198731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,power_law_1.01,0.15055999755859376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,power_law_1.01,0.17525119781494142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,balanced,0.30538666248321533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,power_law_1.01,0.24651520252227782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,power_law_1.01,0.3136255979537964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,power_law_1.01,0.46192641258239747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,balanced,0.3943093220392863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,power_law_1.01,0.5680704116821289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,power_law_1.01,0.7712831974029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,power_law_1.01,1.0621824264526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,balanced,0.48505600293477374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,power_law_1.01,2.390950393676758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,32,power_law_1.2,0.035820800065994265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,32,power_law_1.2,0.03771519958972931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,32,power_law_1.2,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,32,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,32,power_law_1.2,0.042419201135635375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,balanced,0.7624533176422119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,32,power_law_1.2,0.04565759897232056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,32,power_law_1.2,0.048876801133155824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,32,power_law_1.2,0.05187839865684509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,32,power_law_1.2,0.061324799060821535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,32,power_law_1.2,0.05883520245552063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,32,power_law_1.2,0.057708799839019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,32,power_law_1.2,0.061536002159118655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,32,power_law_1.2,0.06375679969787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,balanced,0.03035733352104823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,32,power_law_1.2,0.06398720145225525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,balanced,0.03290133426586787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,32,power_law_1.2,0.06631039977073669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,balanced,0.033189333975315094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,32,power_law_1.2,0.06539520025253295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,balanced,0.03454400102297465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,32,power_law_1.2,0.06632959842681885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,balanced,0.03732266773780187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,32,power_law_1.2,0.08247039914131164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,balanced,1.4948107401529949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,balanced,0.0383840004603068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,power_law_1.01,0.03128960132598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,32,power_law_1.2,0.09215999841690063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,balanced,0.04248000184694926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,32,power_law_1.2,0.09795839786529541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,power_law_1.01,0.035667198896408084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,balanced,0.04139200101296107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,power_law_1.01,0.03269760012626648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,32,power_law_1.2,0.1251520037651062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,balanced,0.04667733112970988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,power_law_1.01,0.0354559987783432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,32,power_law_1.2,0.16246399879455567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,balanced,0.04829333225886027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,power_law_1.01,0.037376001477241516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,32,power_law_1.2,0.19191039800643922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,balanced,0.04562666515509287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,power_law_1.01,0.03758080005645752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,32,power_law_1.2,0.28504319190979005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,32,power_law_1.2,0.4162879943847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,balanced,0.06422399977842967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,power_law_1.01,0.03984639942646027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,32,power_law_1.2,0.6198783874511719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,balanced,0.05927466849486033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,power_law_1.01,0.046598398685455324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,32,power_law_1.2,0.7819839954376221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,balanced,0.06058133145173391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,power_law_1.01,0.0480320006608963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,32,power_law_1.2,0.9023807525634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,balanced,0.06498133142789204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,power_law_1.01,0.04482559859752655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,32,power_law_1.2,1.5482943534851075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,power_law_1.01,0.06394879817962647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,balanced,0.06655466556549072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,power_law_1.01,0.06455680131912231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,balanced,0.028079998989899952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,balanced,0.07232533395290375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,32,power_law_1.2,2.8082752227783203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,16,power_law_1.2,0.031148800253868104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,power_law_1.01,0.060736000537872314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,balanced,0.029850666721661884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,balanced,0.07425066828727722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,16,power_law_1.2,0.0353408008813858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,balanced,0.03044266750415166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,power_law_1.01,0.0607807993888855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,balanced,0.03440000116825104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,16,power_law_1.2,0.03253119885921478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,balanced,0.08518399794896443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,power_law_1.01,0.06823040246963501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,16,power_law_1.2,0.035724800825119016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,power_law_1.01,0.0687936007976532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,balanced,0.0384853333234787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,balanced,0.09358933568000793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,16,power_law_1.2,0.03656319975852966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,balanced,0.039221333960692085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,power_law_1.01,0.07562239766120911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,16,power_law_1.2,0.037011200189590455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,balanced,0.0391839991013209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,balanced,0.11236266295115153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,power_law_1.01,0.07889919877052307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,balanced,0.04304533203442892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,16,power_law_1.2,0.041382399201393125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,power_law_1.01,0.08814079761505127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,balanced,0.041434665520985924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,balanced,0.1311840017636617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,16,power_law_1.2,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,balanced,0.04155199974775314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,power_law_1.01,0.10316159725189208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,16,power_law_1.2,0.046854400634765626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,balanced,0.050570666790008545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,power_law_1.01,0.13372160196304322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,16,power_law_1.2,0.04671359956264496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,balanced,0.17779199282328287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,balanced,0.04842133323351542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,16,power_law_1.2,0.04538240134716034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,power_law_1.01,0.16755839586257934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,power_law_1.01,0.2215872049331665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,balanced,0.048911998669306435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,16,power_law_1.2,0.06292480230331421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,power_law_1.01,0.028601598739624024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,power_law_1.01,0.30524160861968996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,balanced,0.06971199810504913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,balanced,0.21242666244506836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,16,power_law_1.2,0.06279039978981019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,power_law_1.01,0.41661438941955564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,power_law_1.01,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,balanced,0.063701331615448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,16,power_law_1.2,0.05928320288658142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,power_law_1.01,0.5243968009948731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,power_law_1.01,0.029817599058151244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,balanced,0.06663999954859416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,16,power_law_1.2,0.06378880143165588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,power_law_1.01,0.6554944038391113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,power_law_1.01,0.033036801218986514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,16,power_law_1.2,0.06912000179290771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,balanced,0.07869866490364075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,balanced,0.3136639992396037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,power_law_1.01,1.0253567695617676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,power_law_1.01,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,16,power_law_1.2,0.07254400253295898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,balanced,0.08151466647783916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,power_law_1.01,2.0281919479370116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,power_law_1.01,0.036447998881340024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,16,power_law_1.2,0.07786880135536194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,balanced,0.09249599774678548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,16,power_law_1.2,0.08138239979743958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,power_law_1.01,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,balanced,0.10048000017801921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,16,power_law_1.2,0.09404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,balanced,0.3951733509699504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,16,power_law_1.2,0.1081279993057251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,balanced,0.11946133772532146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,power_law_1.01,0.04141440093517303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,16,power_law_1.2,0.14601600170135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,power_law_1.01,0.04094719886779785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,balanced,0.13869866728782654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,16,power_law_1.2,0.18655359745025635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,power_law_1.01,0.04085119962692261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,16,power_law_1.2,0.2760512113571167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,power_law_1.01,0.04966399967670441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,balanced,0.4864319960276286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,16,power_law_1.2,0.33578879833221437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,balanced,0.19339199860890707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,8,power_law_1.2,0.028870400786399842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,power_law_1.01,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,16,power_law_1.2,0.5015359878540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,power_law_1.01,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,8,power_law_1.2,0.03280639946460724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,16,power_law_1.2,0.5938176155090332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,balanced,0.23132266600926718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,power_law_1.01,0.06988800168037415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,8,power_law_1.2,0.02930560111999512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,16,power_law_1.2,0.7605696201324463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,8,power_law_1.2,0.03377279937267304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,power_law_1.01,0.06871680021286011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,power_law_1.2,1.2977984428405762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,8,power_law_1.2,0.03651840090751648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,power_law_1.01,0.0716543972492218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,power_law_1.2,2.514579200744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,balanced,0.3383893171946208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,8,power_law_1.2,0.036236798763275145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,power_law_1.01,0.08024320006370544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,8,power_law_1.2,0.038047999143600464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,16,balanced,0.7584426403045654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,power_law_1.01,0.08773760199546814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,8,power_law_1.2,0.0385919988155365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,power_law_1.01,0.09696000218391418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,8,power_law_1.2,0.041657599806785586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,power_law_1.01,0.11192959547042847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,balanced,0.43235735098520917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,8,power_law_1.2,0.041222399473190306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,power_law_1.01,0.1459264039993286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,8,power_law_1.2,0.04142079949378967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,power_law_1.01,0.17932800054550171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,8,power_law_1.2,0.05043839812278748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,power_law_1.01,0.24518399238586425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,8,power_law_1.2,0.04812160134315491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,power_law_1.01,0.3088320016860962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,8,power_law_1.2,0.051801598072052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,balanced,0.5358933210372925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,power_law_1.01,0.4195456027984619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,8,power_law_1.2,0.07207679748535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,8,power_law_1.2,0.06841599941253662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,power_law_1.01,0.5449664115905761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,8,power_law_1.2,0.08165119886398316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,power_law_1.01,0.680518388748169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,8,power_law_1.2,0.08354560136795045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,power_law_1.01,1.029695987701416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,8,power_law_1.2,0.09015039801597595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,power_law_1.01,2.034111976623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,8,power_law_1.2,0.10421760082244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,16,balanced,1.4908746083577473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,8,power_law_1.2,0.11853439807891845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,balanced,0.8363306522369385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,balanced,0.02714666724205017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,8,power_law_1.2,0.14916479587554932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,balanced,0.028629332780838013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,8,power_law_1.2,0.18542079925537108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,balanced,0.029706666866938274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,8,power_law_1.2,0.2725183963775635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,balanced,0.03253333270549774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,8,power_law_1.2,0.3405440092086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,balanced,0.03642133375008901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,8,power_law_1.2,0.46255998611450194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,balanced,0.040709334115187325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,balanced,0.04112533231576284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,8,power_law_1.2,0.5964608192443848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,balanced,0.04013866682847341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,8,power_law_1.2,0.7199103832244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,balanced,0.041375999649365745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,balanced,0.0410453329483668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,8,power_law_1.2,1.193056011199951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,balanced,0.041877334316571556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,balanced,1.6329174041748047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,8,power_law_1.2,2.4173952102661134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,balanced,0.045034666856129967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,power_law_1.01,0.02768639922142029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,balanced,0.04448533554871877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,power_law_1.01,0.029497599601745604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,balanced,0.04486933350563049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,power_law_1.01,0.02898559868335724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,balanced,0.05364799996217092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,power_law_1.01,0.03261440098285675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,balanced,0.05199466645717621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,balanced,0.05482666691144308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,power_law_1.01,0.035411199927330016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,balanced,0.08142933249473572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,power_law_1.01,0.037836799025535585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,balanced,0.08636800448099773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,power_law_1.01,0.0377023994922638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,balanced,0.10162132978439331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,power_law_1.01,0.04013440012931824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,power_law_1.01,0.03983359932899475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,balanced,0.10961600144704182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,power_law_1.01,0.040601599216461184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,power_law_1.01,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,balanced,0.12991467118263245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,power_law_1.01,0.04368639886379242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,balanced,0.1516746679941813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,power_law_1.01,0.04612480103969574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,power_law_1.01,0.05289599895477295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,power_law_1.01,0.05377920269966126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,balanced,0.21559999386469522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,power_law_1.01,0.05733759999275208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,power_law_1.01,0.08408960103988647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,balanced,0.2585866649945577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,power_law_1.01,0.09364479780197144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,power_law_1.01,0.10611840486526489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,4,power_law_1.2,0.027846398949623107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,power_law_1.01,0.1198848009109497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,balanced,0.38097067674001056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,4,power_law_1.2,0.029580798745155335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,power_law_1.01,0.14759680032730102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,4,power_law_1.2,0.028870400786399842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,power_law_1.01,0.19044480323791504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,4,power_law_1.2,0.03240320086479187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,power_law_1.01,0.2603584051132202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,4,power_law_1.2,0.034745600819587705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,balanced,0.48520533243815106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,power_law_1.01,0.3114815950393677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,4,power_law_1.2,0.035596799850463864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,power_law_1.01,0.45171198844909666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,4,power_law_1.2,0.03735679984092712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,power_law_1.01,0.581715202331543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,4,power_law_1.2,0.037567999958992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,4,power_law_1.2,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,power_law_1.01,0.6981120109558105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,balanced,0.607205351193746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,4,power_law_1.2,0.03978239893913269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,power_law_1.01,1.0944319725036622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,4,power_law_1.2,0.040729600191116336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,4,power_law_1.2,0.044556799530982974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,power_law_1.01,2.1062143325805662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,4,power_law_1.2,0.043859198689460754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,balanced,0.031770666440327965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,4,power_law_1.2,0.04891520142555237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,balanced,0.03236799935499827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,4,power_law_1.2,0.05435519814491272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,4,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,balanced,0.9350079695383707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,balanced,0.03257599969704946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,4,power_law_1.2,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,4,power_law_1.2,0.09258239865303039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,balanced,0.03645866612593333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,4,power_law_1.2,0.10369919538497925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,4,power_law_1.2,0.11198079586029053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,balanced,0.03924266745646795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,4,power_law_1.2,0.12377599477767945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,4,power_law_1.2,0.15213439464569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,power_law_1.01,0.031385600566864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,balanced,0.04735999802748362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,4,power_law_1.2,0.21535999774932862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,4,32,power_law_1.2,0.03142400085926056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,power_law_1.01,0.03194240033626557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,4,power_law_1.2,0.2738944053649902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,power_law_1.01,0.03219200074672699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,4,32,power_law_1.2,0.03204480111598969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,power_law_1.01,0.036595198512077334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,4,power_law_1.2,0.3488703966140747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,4,32,power_law_1.2,0.03246079981327057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,power_law_1.01,0.037945601344108584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,balanced,1.8286879857381184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,balanced,0.047877331574757896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,4,power_law_1.2,0.4726463794708252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,power_law_1.01,0.04715520143508911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,4,32,power_law_1.2,0.03546879887580871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,power_law_1.01,0.04742400050163269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,balanced,0.047914668917655945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,4,32,power_law_1.2,0.03808000087738037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,4,power_law_1.2,0.6129216194152832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,power_law_1.01,0.047712001204490664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,balanced,0.02940266579389572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,4,32,power_law_1.2,0.04670720100402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,4,power_law_1.2,0.7719168186187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,4,32,power_law_1.2,0.047014400362968445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,balanced,0.030559999247392017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,4,power_law_1.2,1.2713408470153809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,4,32,power_law_1.2,0.047577598690986635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,balanced,0.03088533381621043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,power_law_1.01,0.048256000876426695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,4,power_law_1.2,2.3507711410522463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,balanced,0.033861334125200905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,4,32,power_law_1.2,0.048614400625228885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,power_law_1.01,0.04872959852218628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,balanced,0.0489333321650823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,balanced,0.03586666782697042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,4,32,power_law_1.2,0.0488319993019104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,power_law_1.01,0.05123839974403381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,balanced,0.0517493337392807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,4,32,power_law_1.2,0.051577597856521606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,balanced,0.036805334190527596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,power_law_1.01,0.05130239725112915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,balanced,0.05086400111516317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,power_law_1.01,0.057766401767730714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,balanced,0.0433599998553594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,4,32,power_law_1.2,0.051999998092651364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,balanced,0.058543999989827476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,power_law_1.01,0.05851519703865051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,balanced,0.04307200014591217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,4,32,power_law_1.2,0.0584447979927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,balanced,0.05831466615200043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,power_law_1.01,0.02932479977607727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,power_law_1.01,0.05936639904975891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,balanced,0.04258666435877482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,power_law_1.01,0.029734399914741517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,4,32,power_law_1.2,0.058950400352478026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,balanced,0.05929600199063619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,power_law_1.01,0.05934720039367676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,balanced,0.042810668547948204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,power_law_1.01,0.03245440125465393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,4,32,power_law_1.2,0.059628802537918094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,balanced,0.0595360000928243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,power_law_1.01,0.061427199840545656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,balanced,0.04383466641108195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,power_law_1.01,0.03405439853668213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,4,32,power_law_1.2,0.05987840294837952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,power_law_1.01,0.07130879759788514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,balanced,0.060234665870666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,power_law_1.01,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,power_law_1.01,0.07836800217628478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,4,32,power_law_1.2,0.061887997388839724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,balanced,0.06356266637643178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,power_law_1.01,0.041817599534988405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,power_law_1.01,0.10487680435180664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,4,32,power_law_1.2,0.07463679909706115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,balanced,0.06553600231806438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,power_law_1.01,0.04202240109443665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,power_law_1.01,0.12164479494094849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,4,32,power_law_1.2,0.08172799944877625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,balanced,0.04344533383846283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,power_law_1.01,0.0420415997505188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,balanced,0.07309333483378093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,power_law_1.01,0.1715008020401001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,balanced,0.04586133360862732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,power_law_1.01,0.04264320135116577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,4,32,power_law_1.2,0.11317119598388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,power_law_1.01,0.21484799385070802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,balanced,0.0844106674194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,power_law_1.01,0.042630401253700254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,4,32,power_law_1.2,0.13674240112304686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,power_law_1.01,0.34459519386291504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,power_law_1.01,0.043398401141166686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,balanced,0.10195199648539226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,balanced,0.049072002371152244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,4,32,power_law_1.2,0.18484480381011964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,power_law_1.01,0.406009578704834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,power_law_1.01,0.04478079974651337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,balanced,0.05596800148487091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,power_law_1.2,0.23553919792175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,power_law_1.01,0.6177984237670898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,power_law_1.01,0.0490880012512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,4,32,balanced,0.1222879985968272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,balanced,0.05726933479309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,power_law_1.2,0.35350399017333983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,power_law_1.01,0.8156671524047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,power_law_1.01,0.04885759949684143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,balanced,0.06006933252016703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,power_law_1.2,0.4261119842529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,power_law_1.01,0.05585920214653015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,power_law_1.01,0.9054464340209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,4,32,balanced,0.16192533572514853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,power_law_1.2,0.6409791946411133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,power_law_1.01,0.0576960027217865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,power_law_1.01,1.5559359550476075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,balanced,0.06187200049559275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,power_law_1.01,0.06724479794502258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,power_law_1.2,0.8760448455810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,power_law_1.01,0.07322880029678344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,power_law_1.01,3.177248001098633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,balanced,0.0713866651058197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,4,32,balanced,0.20382932821909586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,power_law_1.2,1.0830719947814942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,power_law_1.01,0.091430401802063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,balanced,0.08386666576067607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,power_law_1.01,0.09912959933280945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,power_law_1.2,1.7107904434204102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,power_law_1.01,0.1351040005683899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,balanced,0.10601066549619038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,4,32,balanced,0.29678932825724286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,power_law_1.01,0.1827455997467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,power_law_1.2,3.288409423828125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,power_law_1.01,0.2524224042892456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,balanced,0.12663466731707254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,power_law_1.01,0.3849152088165283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,power_law_1.01,0.49080958366394045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,balanced,0.16691199938456217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,4,32,balanced,0.38228801886240643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,power_law_1.01,0.6841728210449218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,power_law_1.01,0.7990848064422608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,balanced,0.20551466941833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,power_law_1.01,1.3648384094238282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,power_law_1.01,2.6438207626342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,4,32,balanced,0.472213347752889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,balanced,0.3041440049807231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,16,power_law_1.2,0.029145601391792297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,balanced,0.38532265027364093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,16,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,4,32,balanced,0.7418613433837891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,16,power_law_1.2,0.02956799864768982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,16,power_law_1.2,0.032467201352119446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,16,power_law_1.2,0.033958399295806886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,balanced,0.47404801845550537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,16,power_law_1.2,0.036601600050926206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,16,power_law_1.2,0.04327679872512817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,16,power_law_1.2,0.04227199852466583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,16,power_law_1.2,0.04177280068397522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,16,power_law_1.2,0.04340479969978332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,16,power_law_1.2,0.04323840141296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,16,power_law_1.2,0.04344319999217987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,16,power_law_1.2,0.04536960124969482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,16,power_law_1.2,0.048511999845504764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,balanced,0.7421440283457438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,16,power_law_1.2,0.04919680058956146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,16,power_law_1.2,0.055615997314453124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,16,power_law_1.2,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,4,32,balanced,1.4612053235371907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,16,power_law_1.2,0.0697920024394989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,16,power_law_1.2,0.07552639842033386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,16,power_law_1.2,0.09735680222511292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,16,power_law_1.2,0.10907520055770874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,16,power_law_1.2,0.17761919498443604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,16,power_law_1.2,0.21436800956726074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,balanced,0.0271519993742307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,16,power_law_1.2,0.3204351902008057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,balanced,0.02796799937884013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,16,power_law_1.2,0.4148672103881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,balanced,0.028597332537174225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,16,power_law_1.2,0.6572991847991944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,16,power_law_1.2,0.8647551536560059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,balanced,0.03141866624355316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,16,power_law_1.2,1.03755521774292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,balanced,0.033439998825391136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,balanced,0.033930666744709015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,16,power_law_1.2,1.855072021484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,balanced,0.03637866675853729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,balanced,1.4564266204833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,16,power_law_1.2,3.6896575927734374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,balanced,0.03618666778008143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,balanced,0.04048000027736028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,balanced,0.0401653324564298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,power_law_1.01,0.02778240144252777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,balanced,0.041493333876132965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,balanced,0.041450666884581246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,power_law_1.01,0.027820798754692077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,balanced,0.04218133290608724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,balanced,0.04256533086299896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,power_law_1.01,0.03061760067939758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,balanced,0.04470933477083842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,power_law_1.01,0.03219839930534363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,balanced,0.04789333542188009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,balanced,0.04971200227737427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,power_law_1.01,0.033983999490737916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,power_law_1.01,0.03646720051765442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,balanced,0.05886933207511902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,power_law_1.01,0.03585920035839081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,balanced,0.06107733150323232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,power_law_1.01,0.04190720021724701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,balanced,0.07605866591135661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,power_law_1.01,0.04142079949378967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,power_law_1.01,0.04179840087890625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,balanced,0.0876533289750417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,8,power_law_1.2,0.02746239900588989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,power_law_1.01,0.04232960045337677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,balanced,0.11003733674685161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,power_law_1.01,0.043705600500106814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,8,power_law_1.2,0.0278656005859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,balanced,0.13272533814112344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,power_law_1.01,0.04381439983844757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,8,power_law_1.2,0.02803199887275696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,power_law_1.01,0.04700160026550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,8,power_law_1.2,0.030643200874328612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,power_law_1.01,0.052025598287582395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,balanced,0.1772800087928772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,8,power_law_1.2,0.03207040131092072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,power_law_1.01,0.05454720258712768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,8,power_law_1.2,0.033504000306129454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,balanced,0.02672533442576726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,power_law_1.01,0.06880639791488648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,balanced,0.22355733315149942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,8,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,power_law_1.01,0.07404159903526306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,balanced,0.028037334481875103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,8,power_law_1.2,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,power_law_1.01,0.08583679795265198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,balanced,0.028832000990708668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,8,power_law_1.2,0.041440001130104064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,balanced,0.0316746657093366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,power_law_1.01,0.1003648042678833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,8,power_law_1.2,0.041484799981117246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,balanced,0.3281866709391276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,balanced,0.032933334509531655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,power_law_1.01,0.14591360092163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,8,power_law_1.2,0.04238080084323883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,balanced,0.0323840007185936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,8,power_law_1.2,0.04306559860706329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,power_law_1.01,0.19185919761657716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,balanced,0.03409600009520849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,8,power_law_1.2,0.04287360012531281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,balanced,0.03409600009520849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,power_law_1.01,0.2595839977264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,power_law_1.01,0.02696320116519928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,8,power_law_1.2,0.04380159974098206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,balanced,0.42077334721883136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,balanced,0.035631999373435974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,power_law_1.01,0.35514240264892577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,power_law_1.01,0.02766079902648926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,8,power_law_1.2,0.04832639992237091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,balanced,0.03595199932654699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,power_law_1.01,0.4534912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,power_law_1.01,0.02797439992427826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,8,power_law_1.2,0.05363199710845947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,balanced,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,power_law_1.01,0.030931198596954347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,power_law_1.01,0.6132863998413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,8,power_law_1.2,0.05676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,balanced,0.04301866888999939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,balanced,0.043893332282702126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,8,power_law_1.2,0.0692736029624939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,power_law_1.01,0.03207040131092072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,power_law_1.01,0.7300415992736816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,balanced,0.5230400164922079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,balanced,0.04401599864164988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,8,power_law_1.2,0.0821120023727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,power_law_1.01,0.0319680005311966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,power_law_1.01,1.3693632125854491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,balanced,0.044922664761543274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,8,power_law_1.2,0.09318400025367737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,power_law_1.01,2.8369407653808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,8,power_law_1.2,0.11112320423126221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,balanced,0.045824001232783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,power_law_1.01,0.034195199608802795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,8,power_law_1.2,0.15221760272979737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,balanced,0.04831466575463613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,power_law_1.01,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,8,power_law_1.2,0.2180095911026001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,power_law_1.01,0.03601920008659363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,balanced,0.056330665946006775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,power_law_1.01,0.03716480135917664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,8,power_law_1.2,0.33680000305175783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,balanced,0.06268799801667531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,power_law_1.01,0.043961599469184875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,8,power_law_1.2,0.44829440116882324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,balanced,0.815877358118693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,power_law_1.01,0.04390400052070618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,balanced,0.08358933528264363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,power_law_1.01,0.04674560129642487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,8,power_law_1.2,0.5802624225616455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,balanced,0.09299199779828389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,power_law_1.01,0.047251200675964354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,8,power_law_1.2,0.7681856155395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,power_law_1.01,0.04912639856338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,8,power_law_1.2,1.0931712150573731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,balanced,0.11805333693822224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,power_law_1.01,0.05351679921150208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,power_law_1.01,0.06495360136032105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,8,power_law_1.2,1.7226303100585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,balanced,0.14401599764823914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,power_law_1.01,0.07305600047111512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,power_law_1.01,0.09103360176086425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,power_law_1.2,3.7005630493164063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,power_law_1.01,0.1053887963294983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,balanced,0.19506667057673135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,power_law_1.01,0.13362560272216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,4,power_law_1.2,0.02683520019054413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,power_law_1.01,0.18934400081634523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,4,power_law_1.2,0.02778240144252777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,power_law_1.01,0.2612544059753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,balanced,0.24698134263356528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,4,power_law_1.2,0.027910399436950683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,power_law_1.01,0.31297280788421633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,4,power_law_1.2,0.030656000971794127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,4,power_law_1.2,0.03163520097732544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,power_law_1.01,0.5185535907745361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,8,balanced,1.6008532842000325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,4,power_law_1.2,0.03244799971580505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,power_law_1.01,0.6753024101257324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,balanced,0.36767999331156415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,4,power_law_1.2,0.03356800079345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,power_law_1.01,0.7823679924011231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,balanced,0.029861333469549816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,balanced,0.03197866678237915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,4,power_law_1.2,0.034796801209449765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,balanced,0.0320266659061114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,4,power_law_1.2,0.03548159897327423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,balanced,0.02956799914439519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,power_law_1.01,1.2376959800720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,balanced,0.03230399886767069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,4,power_law_1.2,0.035955199599266054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,balanced,0.02956266701221466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,balanced,0.4704960187276204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,balanced,0.033904001116752625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,4,power_law_1.2,0.03717760145664215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,balanced,0.03357866654793421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,balanced,0.030618667602539062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,power_law_1.01,2.410508728027344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,balanced,0.03396799912055334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,4,power_law_1.2,0.04397439956665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,balanced,0.031194667021433514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,balanced,0.035445332527160645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,balanced,0.031178665657838184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,4,power_law_1.2,0.04451839923858643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,balanced,0.03505066782236099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,balanced,0.030917334059874218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,balanced,0.035989334185918175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,4,power_law_1.2,0.04648320078849792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,balanced,0.5899840195973715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,balanced,0.03595733394225439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,balanced,0.03649600098530451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,balanced,0.035962666074434914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,balanced,0.03675200045108795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,balanced,0.03633599976698557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,4,power_law_1.2,0.0473471999168396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,balanced,0.03738133360942205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,balanced,0.036277333895365395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,4,power_law_1.2,0.048665601015090945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,balanced,0.04162133236726125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,balanced,0.04131733377774557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,balanced,0.03628266602754593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,4,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,balanced,0.04297600189844767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,balanced,0.03751466671625773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,balanced,0.047482664386431374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,4,power_law_1.2,0.06641280055046081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,balanced,0.04940799872080485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,balanced,0.036837334434191384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,4,power_law_1.2,0.07446399927139283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,balanced,0.06531733274459839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,balanced,0.07170666754245758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,balanced,0.04308799902598063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,balanced,0.9121493498484293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,4,power_law_1.2,0.09071360230445862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,balanced,0.09692266583442688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,balanced,0.0447626660267512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,4,power_law_1.2,0.11081600189208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,balanced,0.04650133351484934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,balanced,0.10921600461006165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,4,power_law_1.2,0.15253119468688964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,balanced,0.04354666670163473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,4,power_law_1.2,0.1874943971633911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,balanced,0.15044266978899637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,balanced,0.044938668608665466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,4,power_law_1.2,0.26784639358520507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,balanced,0.04515733321507772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,4,power_law_1.2,0.36883840560913084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,balanced,0.17540266116460165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,balanced,0.06261333326498668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,4,power_law_1.2,0.5016191959381103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,balanced,0.055200000603993736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,balanced,0.2516000072161357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,4,power_law_1.2,0.6279935836791992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,balanced,0.07675200204054515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,4,power_law_1.2,0.929964828491211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,balanced,0.31164799133936566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,4,power_law_1.2,1.4029312133789062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,balanced,0.0745600014925003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,power_law_1.2,2.87259521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,balanced,0.10842133561770122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,balanced,0.39447466532389325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,4,balanced,1.7903733253479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,balanced,0.11160000165303548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,balanced,0.583957314491272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,balanced,0.16498667001724243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,balanced,0.19200533628463745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,balanced,0.26103466749191284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,balanced,1.1553333600362141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,balanced,0.35622398058573407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,balanced,0.025386666258176167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,balanced,0.025477332373460133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,balanced,0.027248000105222065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,balanced,0.02700799951950709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,balanced,0.027610667049884796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,balanced,0.02828799933195114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,balanced,0.027722666660944622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,balanced,0.027914665639400482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,balanced,0.6920053164164225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,balanced,0.028384000062942505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.01,0.028812798857688903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.01,0.031404799222946166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.01,0.028838399052619933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.01,0.03142400085926056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,balanced,0.028101332485675812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.01,0.029785600304603577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,balanced,0.02882666637500127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.01,0.029996800422668456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.01,0.033632001280784606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,balanced,0.029631999631722767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.01,0.03361920118331909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.01,0.03438720107078552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,balanced,0.028373333315054577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.01,0.04142079949378967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.01,0.03501439988613129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.01,0.034643200039863584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.01,0.03573119938373566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.01,0.03587839901447296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.01,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.01,0.03560959994792938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.01,0.03678719997406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.01,0.03894400000572205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,balanced,0.035205334424972534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.01,0.040275201201438904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.01,0.038431999087333676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,balanced,0.035029334326585136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.01,0.04220159947872162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.01,0.03840000033378601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,balanced,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.01,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.01,0.0383679986000061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.01,0.044761601090431216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.01,0.0465472012758255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.01,0.04723840057849884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.01,0.05453439950942993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,balanced,0.03991466760635376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.01,0.0530239999294281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.01,0.05144320130348205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,balanced,0.0413973331451416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.01,0.06776319742202759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.01,0.05799040198326111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.01,0.0697983980178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,power_law_1.01,0.024672000110149382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.01,0.0710207998752594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.01,0.09597439765930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.01,0.08785279989242553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.01,0.10990079641342163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,power_law_1.01,0.024876800179481507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.01,0.11809279918670654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.01,0.15312639474868775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,power_law_1.01,0.024934400618076325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.01,0.1096384048461914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,balanced,0.05007466673851013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.01,0.17070080041885377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,power_law_1.01,0.026528000831604004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.01,0.13497600555419922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.01,0.24368638992309571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.01,0.16706559658050538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,power_law_1.01,0.026655998826026917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.01,0.2997119903564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.01,0.2685312032699585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,power_law_1.01,0.027590399980545043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.01,0.4344319820404053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,power_law_1.01,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.01,0.5423744201660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,balanced,0.05622399846712748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.01,0.2934528112411499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,power_law_1.01,0.028460800647735596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.01,0.725651216506958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.01,0.40177278518676757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,power_law_1.01,0.028940799832344054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.01,1.1668800354003905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.01,0.5551487922668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,power_law_1.01,0.03047040104866028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.01,2.2335744857788087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,balanced,0.07334400216738383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.01,0.7022528171539306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.01,1.0366016387939454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,power_law_1.01,0.030937600135803222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.01,2.0164159774780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,power_law_1.01,0.034822401404380796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,balanced,0.08869866530100505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,power_law_1.01,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,power_law_1.01,0.039078399538993835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,balanced,0.12288000186284383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,power_law_1.01,0.04602240025997162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,14336,2,8,32,8,power_law_1.2,0.029209598898887634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,power_law_1.01,0.04953599870204926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,14336,2,8,32,8,power_law_1.2,0.03126400113105774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,14336,2,8,32,8,power_law_1.2,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,power_law_1.01,0.05493760108947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,14336,2,8,32,8,power_law_1.2,0.029151999950408937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,14336,2,8,32,8,power_law_1.2,0.031206399202346802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,14336,2,8,32,8,power_law_1.2,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,power_law_1.01,0.07090560197830201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,14336,2,8,32,8,power_law_1.2,0.029849600791931153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,balanced,0.14696000019709268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,14336,2,8,32,8,power_law_1.2,0.03349120020866394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,power_law_1.01,0.08243839740753174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,14336,2,8,32,8,power_law_1.2,0.030092799663543703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,14336,2,8,32,8,power_law_1.2,0.033452799916267394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,14336,2,8,32,8,power_law_1.2,0.03961600065231323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,14336,2,8,32,8,power_law_1.2,0.03454079926013946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,balanced,0.23463465770085654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,14336,2,8,32,8,power_law_1.2,0.04280959963798523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,14336,2,8,32,8,power_law_1.2,0.03506560027599335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,power_law_1.01,0.09512959718704224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,14336,2,8,32,8,power_law_1.2,0.0359935998916626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,14336,2,8,32,8,power_law_1.2,0.03519999980926514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,14336,2,8,32,8,power_law_1.2,0.036774399876594546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,balanced,0.29470932483673096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,14336,2,8,32,8,power_law_1.2,0.037062400579452516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,14336,2,8,32,8,power_law_1.2,0.03723520040512085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,14336,2,8,32,8,power_law_1.2,0.036364799737930296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,power_law_1.01,0.13963520526885986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,14336,2,8,32,8,power_law_1.2,0.03800320029258728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,14336,2,8,32,8,power_law_1.2,0.03696640133857727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,14336,2,8,32,8,power_law_1.2,0.04067200124263763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,14336,2,8,32,8,power_law_1.2,0.03953279852867127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,power_law_1.01,0.18280320167541503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,14336,2,8,32,8,power_law_1.2,0.02481919974088669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,14336,2,8,32,8,power_law_1.2,0.04074879884719849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,14336,2,8,32,8,power_law_1.2,0.03904640078544617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,14336,2,8,32,8,power_law_1.2,0.04076800048351288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,14336,2,8,32,8,power_law_1.2,0.02500480115413666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,14336,2,8,32,8,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,power_law_1.01,0.22316160202026367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,14336,2,8,32,8,power_law_1.2,0.04373759925365448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,14336,2,8,32,8,power_law_1.2,0.025196799635887147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,balanced,0.37460267543792725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,14336,2,8,32,8,power_law_1.2,0.05394560098648071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,14336,2,8,32,8,power_law_1.2,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,14336,2,8,32,8,power_law_1.2,0.04714879989624023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,power_law_1.01,0.36528000831604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,14336,2,8,32,8,power_law_1.2,0.026956799626350402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,14336,2,8,32,8,power_law_1.2,0.0545087993144989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,14336,2,8,32,8,power_law_1.2,0.04878720045089722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,14336,2,8,32,8,power_law_1.2,0.027340799570083618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,14336,2,8,32,8,power_law_1.2,0.06549760103225707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,14336,2,8,32,8,power_law_1.2,0.058310401439666745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,14336,2,8,32,8,power_law_1.2,0.027871999144554137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,power_law_1.01,0.37805440425872805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,14336,2,8,32,8,power_law_1.2,0.07096319794654846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,balanced,0.559829314549764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,14336,2,8,32,8,power_law_1.2,0.02821120023727417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,14336,2,8,32,8,power_law_1.2,0.07428479790687562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,power_law_1.01,0.7297855854034424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,14336,2,8,32,8,power_law_1.2,0.09569919705390931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,14336,2,8,32,8,power_law_1.2,0.028620800375938414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,14336,2,8,32,8,power_law_1.2,0.08681600093841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,14336,2,8,32,8,power_law_1.2,0.02959359884262085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,14336,2,8,32,8,power_law_1.2,0.10833280086517334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,power_law_1.01,0.9008064270019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,14336,2,8,32,8,power_law_1.2,0.11959680318832397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,balanced,0.03692266593376795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,14336,2,8,32,8,power_law_1.2,0.15149439573287965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,14336,2,8,32,8,power_law_1.2,0.11563520431518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,14336,2,8,32,8,power_law_1.2,0.1733888030052185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,balanced,0.0366293340921402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,power_law_1.01,1.151148796081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,14336,2,8,32,8,power_law_1.2,0.030099201202392577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,14336,2,8,32,8,power_law_1.2,0.16157439947128296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,14336,2,8,32,8,power_law_1.2,0.2598400115966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,balanced,0.03712533414363861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,14336,2,8,32,8,power_law_1.2,0.03464959859848023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,14336,2,8,32,8,power_law_1.2,0.31448318958282473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,power_law_1.01,1.6811136245727538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,14336,2,8,32,8,power_law_1.2,0.18632320165634156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,balanced,0.03763733307520548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,14336,2,8,32,8,power_law_1.2,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,14336,2,8,32,8,power_law_1.2,0.4414976119995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,power_law_1.01,3.607884979248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,balanced,0.038032000263532005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,14336,2,8,32,8,power_law_1.2,0.2725183963775635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,14336,2,8,32,8,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,balanced,1.096186637878418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,14336,2,8,32,8,power_law_1.2,0.6044095993041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,balanced,0.04192000130812327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,14336,2,8,32,8,power_law_1.2,0.29310081005096433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,14336,2,8,32,8,power_law_1.2,0.7500927925109864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,balanced,0.04271999994913737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,14336,2,8,32,8,power_law_1.2,0.4203519821166992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,14336,2,8,32,8,power_law_1.2,1.1459648132324218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,14336,2,8,32,8,power_law_1.2,0.045638400316238406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,balanced,0.04204266766707102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,14336,2,8,32,8,power_law_1.2,0.563040018081665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,14336,2,8,32,8,power_law_1.2,2.235321617126465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,14336,2,8,32,8,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,balanced,0.042581334710121155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,14336,2,8,32,8,power_law_1.2,0.6468800067901611
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,14336,2,8,32,8,power_law_1.2,0.05603839755058289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,balanced,0.042090664307276406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,14336,2,8,32,8,power_law_1.2,1.0504960060119628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,balanced,0.043290664752324425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,14336,2,8,32,8,power_law_1.2,0.07129600048065185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,14336,2,8,32,8,power_law_1.2,2.147052764892578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,balanced,0.044480000933011375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,14336,2,8,32,8,power_law_1.2,0.08298879861831665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,balanced,0.04423999786376953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,balanced,0.04455466568470001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,14336,2,8,32,8,power_law_1.2,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,balanced,0.04935466746489207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,balanced,0.05020800232887268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,14336,2,8,32,8,power_law_1.2,0.1402176022529602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,balanced,0.053445334235827126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,balanced,0.060421332716941833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,14336,2,8,32,8,power_law_1.2,0.198470401763916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,balanced,0.058634668588638306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,14336,2,8,32,8,power_law_1.2,0.22878720760345458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,balanced,0.06621333460013072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,14336,2,8,32,8,power_law_1.2,0.35916159152984617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,balanced,0.07544533411661784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,balanced,0.09545600414276123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,14336,2,8,32,8,power_law_1.2,0.42136321067810056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,14336,2,8,32,8,power_law_1.2,0.7343935966491699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,balanced,0.10081600149472554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,14336,2,8,32,8,power_law_1.2,0.9145407676696777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,balanced,0.15341867009798685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,14336,2,8,32,8,power_law_1.2,1.1841728210449218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,14336,2,8,32,8,power_law_1.2,1.8128128051757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,balanced,0.15482133626937866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,14336,2,8,32,8,power_law_1.2,3.4944126129150392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,balanced,0.03533333291610082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,balanced,0.03530666728814443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,balanced,0.035786665976047516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,balanced,0.23869866132736206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,balanced,0.03678400069475174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,balanced,0.03643733263015747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,balanced,0.26844267050425213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,balanced,0.03713600089152654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,balanced,0.03843733419974645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,balanced,0.037765334049860634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,balanced,0.37468798955281574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,balanced,0.037434667348861694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,balanced,0.02903999884923299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,balanced,0.038405333956082664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,balanced,0.029109333952267964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,balanced,0.03995199998219808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,balanced,0.028768000503381092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,balanced,0.040063999593257904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,balanced,0.030773334205150604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,balanced,0.040063999593257904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,balanced,0.498149315516154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,balanced,0.030640001098314922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,balanced,0.04005866746107737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,balanced,0.03139200061559677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,balanced,0.045935998360315956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,balanced,0.03188266605138779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,balanced,0.046256000796953835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,balanced,0.03150933235883713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,balanced,0.0480373352766037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,balanced,0.03177600105603536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,balanced,0.05857066810131073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,balanced,0.03286933402220408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,balanced,0.06559466818968455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,balanced,0.9849920272827148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,balanced,0.08190933366616567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,balanced,0.09232532978057861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,balanced,0.03173333406448364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,balanced,0.11960533261299133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,balanced,0.03249600032965342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,balanced,0.03356266766786575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,balanced,0.14190933108329773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,balanced,0.032058666149775185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,balanced,0.19941866397857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,balanced,0.23838933308919272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,balanced,0.039434666434923805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,balanced,0.040133332212766014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,balanced,0.3475573460261027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,balanced,0.04072533299525579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.01,0.03447679877281189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.01,0.036185601353645326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,balanced,0.4303733507792155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.01,0.034585601091384886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,balanced,0.04720533390839895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.01,0.03630079925060272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.01,0.0350847989320755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,balanced,0.05044800043106079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.01,0.03597440123558045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.01,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.01,0.03694080114364624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.01,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.01,0.03720960021018982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,balanced,0.5514880021413168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.01,0.03701759874820709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.01,0.055878400802612305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.01,0.03803519904613495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.01,0.05820159912109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,16384,2,8,32,8,power_law_1.2,0.036268800497055054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.01,0.03816959857940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,balanced,0.0662666658560435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.01,0.04013440012931824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.01,0.04364160001277924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,power_law_1.01,0.030041599273681642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,16384,2,8,32,8,power_law_1.2,0.03598720133304596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.01,0.04147840142250061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.01,0.04467839896678925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,balanced,0.8259893258412679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,16384,2,8,32,8,power_law_1.2,0.03641600012779236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,power_law_1.01,0.02800639867782593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.01,0.04141440093517303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.01,0.04746879935264588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,balanced,0.07528000076611836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,16384,2,8,32,8,power_law_1.2,0.03729279935359955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.01,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,power_law_1.01,0.028095999360084535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.01,0.048281601071357726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.01,0.04418559968471527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,power_law_1.01,0.029721599817276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,16384,2,8,32,8,power_law_1.2,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.01,0.04940159916877747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.01,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.01,0.04577920138835907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,power_law_1.01,0.029951998591423036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,16384,2,8,32,8,power_law_1.2,0.05333120226860046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,balanced,0.0990666647752126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.01,0.05237119793891907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.01,0.06034560203552246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,16384,2,8,32,8,power_law_1.2,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.01,0.05429760217666626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.01,0.07386239767074584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,power_law_1.01,0.03308799862861633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,16384,2,8,32,8,power_law_1.2,0.04339199960231781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.01,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.01,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,power_law_1.01,0.03320960104465485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,16384,2,8,32,8,power_law_1.2,0.04439040124416351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.01,0.10247679948806762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.01,0.08179839849472045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,balanced,0.11827199657758077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,16384,2,8,32,8,power_law_1.2,0.044198399782180785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,balanced,1.6562986373901367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,power_law_1.01,0.03432320058345795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.01,0.09462400078773499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.01,0.09228159785270691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,16384,2,8,32,8,power_law_1.2,0.047251200675964354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.01,0.124236798286438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,power_law_1.01,0.03492479920387268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.01,0.12247680425643921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,16384,2,8,32,8,power_law_1.2,0.04875519871711731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.01,0.1385151982307434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.01,0.13262720108032228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.01,0.20200319290161134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,16384,2,8,32,8,power_law_1.2,0.050783997774124144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.01,0.19196159839630128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.01,0.24977281093597412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,power_law_1.01,0.03429119884967804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,16384,2,8,32,8,power_law_1.2,0.05262079834938049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.01,0.23834240436553955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.01,0.41799678802490237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,balanced,0.16618667046229044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,16384,2,8,32,8,power_law_1.2,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.01,0.45958399772644043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.01,0.3559231996536255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,16384,2,8,32,8,power_law_1.2,0.07497599720954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,power_law_1.01,0.03824639916419983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.01,0.6457983970642089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.01,0.4254464149475098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,balanced,0.21644800901412964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,16384,2,8,32,8,power_law_1.2,0.08236799836158752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,power_law_1.01,0.04982399940490723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.01,0.800102424621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.01,0.6197247982025147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,16384,2,8,32,8,power_law_1.2,0.11445120573043824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.01,0.9478272438049317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.01,0.8325951576232911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,balanced,0.33604268232981366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,16384,2,8,32,8,power_law_1.2,0.09748479723930359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.01,1.4825599670410157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.01,1.0354623794555664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,16384,2,8,32,8,power_law_1.2,0.13173120021820067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,power_law_1.01,0.05013759732246399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,16384,2,8,32,8,power_law_1.2,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.01,2.6125055313110352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,16384,2,8,32,8,power_law_1.2,0.13647359609603882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.01,1.6282751083374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,power_law_1.01,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,balanced,0.4123680194218953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,16384,2,8,32,8,power_law_1.2,0.03438720107078552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,16384,2,8,32,8,power_law_1.2,0.19663360118865966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,power_law_1.01,0.0629696011543274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,16384,2,8,32,8,power_law_1.2,0.2740607976913452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,16384,2,8,32,8,power_law_1.2,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.01,3.1542720794677734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,16384,2,8,32,8,power_law_1.2,0.42181758880615233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,16384,2,8,32,8,power_law_1.2,0.03607679903507233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,power_law_1.01,0.10190080404281616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,16384,2,8,32,8,power_law_1.2,0.03606399893760681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,16384,2,8,32,8,power_law_1.2,0.4535808086395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,power_law_1.01,0.1207360029220581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,16384,2,8,32,8,power_law_1.2,0.03723520040512085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,16384,2,8,32,8,power_law_1.2,0.5729983806610107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,16384,2,8,32,8,power_law_1.2,0.03805440068244934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,balanced,0.5373919804890951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,16384,2,8,32,8,power_law_1.2,0.7923264026641845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,16384,2,8,32,8,power_law_1.2,0.9899968147277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,16384,2,8,32,8,power_law_1.2,0.039417600631713866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,power_law_1.01,0.15996160507202148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,16384,2,8,32,8,power_law_1.2,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,16384,2,8,32,8,power_law_1.2,1.6227455139160156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,16384,2,8,32,8,power_law_1.2,0.04186240136623383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,16384,2,8,32,8,power_law_1.2,2.8006912231445313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,power_law_1.01,0.21530239582061766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,balanced,0.7930933634440104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,16384,2,8,32,8,power_law_1.2,0.04059520065784454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,power_law_1.01,0.2857856035232544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,16384,2,8,32,8,power_law_1.2,0.04677119851112366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,16384,2,8,32,8,power_law_1.2,0.04481280148029328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,power_law_1.01,0.3445503950119019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,16384,2,8,32,8,power_law_1.2,0.04726400077342987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,16384,2,8,32,8,power_law_1.2,0.0543615996837616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,16384,2,8,32,8,power_law_1.2,0.0549888014793396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,power_law_1.01,0.516435194015503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,16384,2,8,32,8,power_law_1.2,0.06483200192451477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,power_law_1.01,0.6605311870574951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,16384,2,8,32,8,power_law_1.2,0.0824512004852295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,balanced,1.5645546913146973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,16384,2,8,32,8,power_law_1.2,0.08946560025215149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,power_law_1.01,0.9998016357421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,16384,2,8,32,8,power_law_1.2,0.12632319927215577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,power_law_1.01,1.2729280471801758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,16384,2,8,32,8,power_law_1.2,0.1323904037475586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,power_law_1.01,1.7427648544311523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,16384,2,8,32,8,power_law_1.2,0.19692800045013428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,16384,2,8,32,8,power_law_1.2,0.25160319805145265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,power_law_1.01,2.545235252380371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,16384,2,8,32,8,power_law_1.2,0.34305920600891116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,16384,2,8,32,8,power_law_1.2,0.028191998600959778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,power_law_1.01,5.087993621826172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,16384,2,8,32,8,power_law_1.2,0.421446418762207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,16384,2,8,32,8,power_law_1.2,0.028191998600959778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,16384,2,8,32,8,power_law_1.2,0.5998528003692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,16384,2,8,32,8,power_law_1.2,0.028531199693679808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,16384,2,8,32,8,power_law_1.2,0.8315199851989746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,16384,2,8,32,8,power_law_1.2,0.030086401104927062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,16384,2,8,32,8,power_law_1.2,1.0347583770751954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,16384,2,8,32,8,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,16384,2,8,32,8,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,16384,2,8,32,8,power_law_1.2,1.6532159805297852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,16384,2,8,32,8,power_law_1.2,0.03307519853115082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,16384,2,8,32,8,power_law_1.2,2.9241216659545897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,16384,2,8,32,8,power_law_1.2,0.034329599142074584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,16384,2,8,32,8,power_law_1.2,0.03427839875221252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,16384,2,8,32,8,power_law_1.2,0.035673600435256955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,16384,2,8,32,8,power_law_1.2,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,16384,2,8,32,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,16384,2,8,32,8,power_law_1.2,0.04256640076637268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,16384,2,8,32,8,power_law_1.2,0.05088000297546387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,16384,2,8,32,8,power_law_1.2,0.055174398422241214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,16384,2,8,32,8,power_law_1.2,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,16384,2,8,32,8,power_law_1.2,0.06845440268516541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,16384,2,8,32,8,power_law_1.2,0.10022399425506592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,16384,2,8,32,8,power_law_1.2,0.1261247992515564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,16384,2,8,32,8,power_law_1.2,0.167302405834198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,16384,2,8,32,8,power_law_1.2,0.21753599643707275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,16384,2,8,32,8,power_law_1.2,0.2941312074661255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,16384,2,8,32,8,power_law_1.2,0.3438976049423218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,16384,2,8,32,8,power_law_1.2,0.5269760131835938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,16384,2,8,32,8,power_law_1.2,0.6665088176727295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,16384,2,8,32,8,power_law_1.2,1.023078441619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,16384,2,8,32,8,power_law_1.2,1.2503744125366212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,16384,2,8,32,8,power_law_1.2,1.6784767150878905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,16384,2,8,32,8,power_law_1.2,2.485228729248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,16384,2,8,32,8,power_law_1.2,5.151609420776367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,balanced,0.19764800866444907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,balanced,0.18860799074172974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,balanced,0.18951465686162314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,balanced,0.19989333550135294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,balanced,0.1986773411432902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,balanced,0.19549334049224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,balanced,0.1981226603190104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,balanced,0.11928000052769978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,balanced,0.19668267170588175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,balanced,0.11548266808191936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,balanced,0.19371734062830606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,balanced,0.12024000287055969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,balanced,0.19868266582489014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,balanced,0.12281599640846252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,balanced,0.20200000206629434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,balanced,0.11990400155385335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,balanced,0.11846933762232463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,balanced,0.1928106745084127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,balanced,0.11746133367220561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.1919360041618347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,balanced,0.1981226603190104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,balanced,0.12519466876983643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.18785279989242554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,balanced,0.1904159982999166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,balanced,0.055349335074424744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,balanced,0.13149866461753845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.1890112042427063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,balanced,0.19588265816370645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,balanced,0.12794133027394614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.18145920038223268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,balanced,0.05317866802215576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,balanced,0.2055520017941793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.18810240030288697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,balanced,0.12924266854921976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,balanced,0.055973331133524575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.19943679571151735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,balanced,0.18835200866063437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,balanced,0.060517330964406334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,balanced,0.12390933434168498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.19520000219345093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,balanced,0.19152534008026123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,balanced,0.06146133442719778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.1920575976371765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,balanced,0.13032000263532004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.19841920137405394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,balanced,0.05881600081920624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,balanced,0.19699732462565103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,balanced,0.12521066268285116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.18670719861984253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,balanced,0.06037333110968272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.18398720026016235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,balanced,0.06071466704209646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,balanced,0.13831999897956848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,balanced,0.20130133628845215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.17905280590057374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,balanced,0.061237335205078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,balanced,0.13277332981427512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.17504639625549318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,balanced,0.06192533175150553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.16866559982299806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,balanced,0.20081067085266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,balanced,0.13403200109799704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,balanced,0.06282133360703786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.16701439619064332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,balanced,0.06314133107662201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.15603840351104736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,balanced,0.14080533385276794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,balanced,0.06491733094056447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.1469696044921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,balanced,0.2048693299293518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,balanced,0.15505599975585938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.256876802444458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,balanced,0.06534400085608165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.2321471929550171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,balanced,0.07045333087444305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,balanced,0.17047999302546182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.3273024082183838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.11713919639587403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,balanced,0.07147733370463054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,balanced,0.19741332530975342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.40932478904724123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,balanced,0.07486933469772339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.11384960412979125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,balanced,0.18091734250386557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.5673408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,balanced,0.08238933483759563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.7791615962982178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.11971839666366577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.01,1.1795968055725097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,balanced,0.3562613328297933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.12433919906616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,balanced,0.20964799324671426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.01,1.377676773071289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.12288000583648681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.01,2.291622352600098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.12406400442123414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.01,3.2682815551757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,balanced,0.23358400662740073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.12723840475082399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,balanced,0.08912000060081482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,balanced,0.3399733304977417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.01,4.2535041809082035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.12467199563980103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.12037119865417481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,balanced,0.10150933265686035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.01,8.365875244140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,power_law_1.01,0.05486720204353333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,balanced,0.3568906784057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.12013440132141114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,power_law_1.01,0.05241600275039673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,balanced,0.11276266972223918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.12157440185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.1922368049621582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.01,15.660089111328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,power_law_1.01,0.05231999754905701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.11857919692993164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.1872383952140808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,balanced,0.4971253474553426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,power_law_1.01,0.05694720149040222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.11866240501403809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.18570879697799683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,balanced,0.40324799219767254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,power_law_1.01,0.0581055998802185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.11889920234680176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.18718719482421875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,power_law_1.01,0.05907840132713318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.1253056049346924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.18869119882583618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,power_law_1.01,0.059571200609207155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.1162943959236145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.19166719913482666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,balanced,0.13884799679120383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,power_law_1.01,0.060601598024368285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.11223679780960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.1859007954597473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,power_law_1.01,0.060761600732803345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.1768895983695984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.1859455943107605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,balanced,0.5815680027008057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,power_law_1.01,0.0610368013381958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,balanced,0.1600266695022583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.1638592004776001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.18769919872283936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,balanced,0.6434933344523112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.21671679019927978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,power_law_1.01,0.0637503981590271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.18865920305252076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,power_law_1.01,0.0649728000164032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.2923583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.17926399707794188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.1764224052429199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,power_law_1.01,0.0669376015663147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.4196864128112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.16918400526046753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,power_law_1.01,0.07175679802894593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.4787903785705566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.16227840185165404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,power_law_1.01,0.07612159848213196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.1590016007423401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,0.7051455974578857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,power_law_1.01,0.08981760144233704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.13876479864120483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,0.8534336090087891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,balanced,0.7508906523386637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.2600127935409546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,power_law_1.01,0.09450240135192871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.3041663885116577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,balanced,0.20756800969441733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,1.3454336166381835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,power_law_1.01,0.12327040433883667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.3150784015655518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,balanced,0.7932480176289877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,1.8793407440185548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.49609599113464353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.6341504096984864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.01,2.614419174194336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.01,0.11824640035629272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,1,256,power_law_1.2,1.0364352226257325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.01,0.16128640174865722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,1,256,power_law_1.2,1.3371456146240235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,balanced,0.252618670463562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.01,4.395872116088867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.01,0.20288639068603515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,1,256,power_law_1.2,2.0196352005004883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,1,256,power_law_1.2,3.2642494201660157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.01,9.073107147216797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,balanced,0.9251840114593506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,1,256,power_law_1.2,6.325120162963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.01,0.2781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.01,0.36172800064086913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,1,256,power_law_1.2,7.301689910888672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,1,256,power_law_1.2,10.435135650634766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.01,0.4466815948486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.01,0.6104000091552735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,power_law_1.2,18.49571838378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,1,256,balanced,1.2546292940775554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,balanced,0.35256532828013104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.11329280138015747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.01,0.898739242553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.11958400011062623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,power_law_1.2,44.958944702148436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.12216320037841796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.12136960029602051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.01,1.0868351936340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.1177664041519165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,balanced,1.4490879376729329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.1253376007080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.1217087984085083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,balanced,0.44463467597961426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.12083200216293336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.1230463981628418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.11589759588241577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,power_law_1.01,1.5793984413146973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.11500799655914307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.11333119869232178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.1114240050315857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.10883200168609619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.10922880172729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.01,2.120652770996094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.17057280540466307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.1634112000465393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.01,4.22883186340332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,balanced,0.5559893449147543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.2069119930267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.27726719379425047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.36399359703063966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.5667903900146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.7066239833831787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,1.1440511703491212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,1,256,balanced,2.4576212565104165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,1.5951423645019531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,2.619820785522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,3.740991973876953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,1,256,power_law_1.2,4.652716827392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,balanced,2.887493451436361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,balanced,0.8388266563415527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,1,256,power_law_1.2,8.528614044189453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,1,256,power_law_1.2,22.0919677734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,1,256,power_law_1.2,0.0517632007598877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,1,256,power_law_1.2,0.05244799852371216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,1,256,power_law_1.2,0.05259519815444946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,1,256,power_law_1.2,0.0571008026599884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,1,256,power_law_1.2,0.058156800270080564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,1,256,power_law_1.2,0.05952640175819397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,1,256,power_law_1.2,0.059008002281188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,1,256,power_law_1.2,0.06046079993247986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,1,256,power_law_1.2,0.06092159748077393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,1,256,power_law_1.2,0.06232320070266724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,1,256,power_law_1.2,0.06389120221138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,1,256,power_law_1.2,0.06856319904327393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,balanced,1.6894346872965496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,1,256,power_law_1.2,0.07047039866447449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,1,256,power_law_1.2,0.07519999742507935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,1,256,power_law_1.2,0.08973439931869506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,1,256,power_law_1.2,0.0945792019367218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,1,256,power_law_1.2,0.1133247971534729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,1,256,power_law_1.2,0.15202560424804687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,balanced,0.11993599931399028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.2,0.15034879446029664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,balanced,0.11528533697128296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.2,0.21749119758605956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.2,0.27698559761047364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,balanced,0.11892267068227132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,balanced,0.1218986709912618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,balanced,0.12168000141779582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.2,0.42076802253723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,balanced,0.07747200131416321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.2,0.6319744110107421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,balanced,0.2055466572443644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,balanced,0.07852266728878021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,balanced,0.08021866778532664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,balanced,0.21312532822291055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,balanced,0.08171199758847554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,balanced,0.20977065960566202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,balanced,0.08084799846013387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.2,0.7315264225006104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,balanced,0.1293280025323232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,balanced,0.20672533909479776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.2,1.001529598236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,balanced,0.12538133064905801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,balanced,0.2028533418973287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,balanced,0.12917332847913107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,balanced,0.19723200798034668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,balanced,0.12871999541918436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,balanced,0.126720001300176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,balanced,0.21201066176096597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.2,1.4766655921936036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,balanced,0.13266666730244955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,balanced,0.19633066654205322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,balanced,0.13110400239626566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,balanced,0.19582400719324747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,balanced,0.13548266887664795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.2,2.051744079589844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,balanced,0.13054933150609335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,balanced,0.19597333669662476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,balanced,0.13988266388575235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,balanced,0.2117919921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,balanced,0.13778666655222574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,balanced,0.20286399126052856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,1,256,power_law_1.2,3.155084800720215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,balanced,0.1418453355630239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,balanced,0.20517333348592123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,balanced,0.1497813363869985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,balanced,0.2046453356742859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.2,4.176652908325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,balanced,0.15549866358439127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,balanced,0.2063200076421102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.2,9.6202880859375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,balanced,0.175818661848704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,balanced,0.2058239976565043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,balanced,0.18433600664138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,balanced,0.2084853251775106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,balanced,0.21287467082341513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,balanced,0.20220265785853067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,balanced,0.23745600382486978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,balanced,0.3645813465118408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,balanced,0.36946133772532147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,balanced,0.35309334595998126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,balanced,0.04457066456476847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,balanced,0.4141706625620524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.01,0.19630080461502075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,balanced,0.04478933413823446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,balanced,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,balanced,0.0470773329337438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.01,0.19575040340423583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,balanced,0.04817600051561991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,balanced,0.05890133480230967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.01,0.16247040033340454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,balanced,0.060218666990598045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,balanced,0.5126133362452189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,balanced,0.06099733213583628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.01,0.17828480005264283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,balanced,0.061066667238871254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,balanced,0.5937013228734335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,balanced,0.06189866860707601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.01,0.17904640436172486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,balanced,0.06277866661548615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.01,0.12437119483947753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,balanced,0.06286400059858958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.01,0.1971392035484314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,balanced,0.06454933186372121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.01,0.12055679559707641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.01,0.19925119876861572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,balanced,0.06518400212128957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.01,0.12360320091247559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,balanced,0.07106133302052815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.01,0.2039936065673828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.01,0.12564480304718018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,balanced,0.07133333384990692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,balanced,0.6712480386098226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,power_law_1.01,0.05368959903717041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,balanced,0.0754613329966863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.01,0.19701759815216063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.01,0.12282240390777588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,balanced,0.7697493235270182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,power_law_1.01,0.052723199129104614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.01,0.19404799938201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.01,0.12830719947814942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,power_law_1.01,0.052665597200393675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,balanced,0.08339200417200725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.01,0.1902783989906311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.01,0.12811520099639892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,power_law_1.01,0.053478401899337766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.01,0.1267135977745056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.01,0.1886016011238098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,power_law_1.01,0.057760000228881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.01,0.1268928050994873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.01,0.1915519952774048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,power_law_1.01,0.05920640230178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.01,0.1807935953140259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.01,0.12675199508666993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,power_law_1.01,0.0599295973777771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.01,0.18802560567855836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.01,0.1264448046684265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,balanced,0.08995200196901958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,balanced,0.7966826756795248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,power_law_1.01,0.06125440001487732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.01,0.17411199808120728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.01,0.12524800300598143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,balanced,0.9481066862742106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,balanced,0.10405866305033366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.01,0.16651519536972045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,power_law_1.01,0.06117759943008423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.01,0.1264256000518799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.01,0.21070079803466796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,power_law_1.01,0.06183040142059326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.01,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,balanced,0.11494933565457661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.01,0.2514879941940308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.01,0.1275264024734497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,power_law_1.01,0.06466559767723083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.01,0.3081088066101074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.01,0.12475520372390747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,power_law_1.01,0.0662015974521637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.01,0.3823168039321899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.01,0.1244096040725708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,power_law_1.01,0.0676479995250702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,2,128,power_law_1.2,0.19189120531082154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.01,0.49105281829833985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.01,0.1411072015762329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,power_law_1.01,0.07170559763908387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,2,128,power_law_1.2,0.19507839679718017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.01,0.17522560358047484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.01,0.5917119979858398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,power_law_1.01,0.07850239872932434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,balanced,0.1421173314253489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,2,128,power_law_1.2,0.11390080451965331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.01,0.21966080665588378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.01,0.8490880012512207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,power_law_1.01,0.08298239707946778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,2,128,power_law_1.2,0.17754240036010743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.01,0.2558784008026123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.01,1.0811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,power_law_1.01,0.09789440035820007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,balanced,0.16487999757130942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,2,128,power_law_1.2,0.18791040182113647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.01,0.3685312032699585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.01,1.7617855072021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,2,128,power_law_1.2,0.19735039472579957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.01,0.4250432014465332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,power_law_1.01,0.11111680269241334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,balanced,1.2428320248921711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,balanced,1.4838186899820964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,2,128,power_law_1.2,0.1991744041442871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.01,2.3015487670898436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.01,0.6581952095031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,2,128,power_law_1.2,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.01,0.8472512245178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.01,3.1408639907836915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,2,128,power_law_1.2,0.19434880018234252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,power_law_1.01,0.12012159824371338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,balanced,0.21675733725229898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.01,1.1588671684265137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,2,128,power_law_1.2,0.19141759872436523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,power_law_1.01,0.14906879663467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.01,5.411923217773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.01,1.7443456649780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,2,128,power_law_1.2,0.18496639728546144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,power_law_1.01,0.1923840045928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.01,2.004012870788574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,2,128,power_law_1.2,0.18305280208587646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.01,11.247628784179687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,balanced,0.26499199867248535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,2,128,power_law_1.2,0.18812160491943358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.01,3.1474239349365236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,power_law_1.01,0.24532480239868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,2,128,power_law_1.2,0.18024959564208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,power_law_1.01,0.3228480100631714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,2,128,power_law_1.2,0.17386239767074585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.01,7.49200668334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,2,128,power_law_1.2,0.17448320388793945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,power_law_1.01,0.4458943843841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,2,128,power_law_1.2,0.1985152006149292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,power_law_1.01,0.5878528118133545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,2,128,power_law_1.2,0.2288640022277832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,2,128,power_law_1.2,0.27842559814453127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,balanced,0.37346665064493817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,2,128,power_law_1.2,0.35149440765380857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,power_law_1.01,0.8326592445373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,2,128,power_law_1.2,0.48821120262145995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,power_law_1.01,1.067187213897705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,2,128,power_law_1.2,0.6554751873016358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,2,128,power_law_1.2,0.7376704216003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,2,128,power_law_1.2,1.118387222290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,power_law_1.01,1.3590720176696778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,2,128,power_law_1.2,2.0378559112548826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,balanced,0.4726133346557617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,power_law_1.01,2.3520576477050783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,2,128,power_law_1.2,3.3102527618408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,2,128,power_law_1.2,0.12416000366210937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,power_law_1.01,4.495673751831054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,2,128,power_law_1.2,4.1160320281982425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,2,128,power_law_1.2,0.12028160095214843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,balanced,2.9878133138020835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,2,128,power_law_1.2,0.0871936023235321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,2,128,power_law_1.2,4.805433654785157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,2,128,power_law_1.2,0.117740797996521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,balanced,2.5718026161193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,2,128,power_law_1.2,7.3444160461425785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,2,128,power_law_1.2,0.1214784026145935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,2,128,power_law_1.2,0.1277119994163513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,2,128,power_law_1.2,0.1272447943687439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,balanced,0.5888106822967529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,2,128,power_law_1.2,23.78044738769531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,2,128,power_law_1.2,0.12862080335617065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,2,128,power_law_1.2,0.12513279914855957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,2,128,power_law_1.2,0.12392319440841675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,2,128,power_law_1.2,0.12692480087280272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,2,128,power_law_1.2,0.12710399627685548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,2,128,power_law_1.2,0.12770559787750244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,2,128,power_law_1.2,0.12375680208206177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,2,128,power_law_1.2,0.12517759799957276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,2,128,power_law_1.2,0.11847039461135864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,2,128,power_law_1.2,0.1437376022338867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,2,128,power_law_1.2,0.16102399826049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,balanced,0.9207146962483724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,2,128,power_law_1.2,0.21441280841827393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,2,128,power_law_1.2,0.24749441146850587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,2,128,power_law_1.2,0.31120638847351073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,2,128,power_law_1.2,0.40286078453063967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,2,128,power_law_1.2,0.5745535850524902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,2,128,power_law_1.2,0.9102463722229004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,2,128,power_law_1.2,1.0789759635925293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,2,128,power_law_1.2,1.7473920822143554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,2,128,power_law_1.2,2.597849655151367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,2,128,power_law_1.2,3.35335693359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,2,128,power_law_1.2,5.322899246215821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,2,128,power_law_1.2,13.15984649658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,balanced,1.8437066078186035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,balanced,0.08566932876904805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,balanced,0.07646400233109792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,balanced,0.08079466720422109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,balanced,0.08117866516113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,2,128,power_law_1.2,0.05591679811477661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,balanced,0.10682132840156555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,balanced,0.1962826649347941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,2,128,power_law_1.2,0.05265920162200928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,balanced,0.20759467283884683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,2,128,power_law_1.2,0.04933120012283325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,balanced,0.20456000169118246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,balanced,0.19620800018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,2,128,power_law_1.2,0.05469440221786499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,balanced,0.20444266001383463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,2,128,power_law_1.2,0.058412802219390866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,2,128,power_law_1.2,0.05803520083427429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,balanced,0.2158986727396647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,2,128,power_law_1.2,0.060236799716949466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,balanced,0.20174400011698404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,2,128,power_law_1.2,0.0609279990196228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,balanced,0.07085866729418437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,balanced,0.2067413330078125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,2,128,power_law_1.2,0.061350399255752565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,balanced,0.07245866457621257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,balanced,0.1905440092086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,2,128,power_law_1.2,0.06331520080566407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,balanced,0.07292800148328145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,balanced,0.20124799013137817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,2,128,power_law_1.2,0.06506879925727845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,balanced,0.07371733089288075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,balanced,0.08206933240095775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,balanced,0.20007999738057455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,2,128,power_law_1.2,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,balanced,0.1311893363793691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,balanced,0.19738133748372397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,2,128,power_law_1.2,0.06933119893074036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,balanced,0.1260373294353485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,balanced,0.21740800142288208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,2,128,power_law_1.2,0.07374079823493958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,balanced,0.12804800271987915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,2,128,power_law_1.2,0.08440319895744323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,balanced,0.12170666456222534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,balanced,0.1900426745414734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,balanced,0.04397333165009817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,balanced,0.1423413356145223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,2,128,power_law_1.2,0.09082880020141601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,balanced,0.13054399689038595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.01,0.18498560190200805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.01,0.12451839447021484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,balanced,0.19979200760523477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,balanced,0.04443199932575226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,2,128,power_law_1.2,0.10334080457687378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,balanced,0.13852266470591226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,balanced,0.04452266792456309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.01,0.1893183946609497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.01,0.11980160474777221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,balanced,0.1402186652024587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,balanced,0.2037386695543925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,2,128,power_law_1.2,0.12499840259552002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,balanced,0.046613335609436035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.01,0.17452800273895264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,balanced,0.1295199990272522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.01,0.10151679515838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,balanced,0.04854933420817057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,balanced,0.13897066315015158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.01,0.13167359828948974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.01,0.09136639833450318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,balanced,0.21923200289408365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,balanced,0.14660267035166422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,balanced,0.05973333120346069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.01,0.15672320127487183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.01,0.09175040125846863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,2,128,power_law_1.2,0.13186559677124024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,balanced,0.0612960010766983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,balanced,0.14548800388971964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.01,0.16767359972000123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.01,0.11461759805679321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,balanced,0.06169066826502482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,2,128,power_law_1.2,0.18844159841537475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,balanced,0.15005333224932352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,balanced,0.2153973380724589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.01,0.20480639934539796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.01,0.12223999500274658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,balanced,0.06196266909440359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,2,128,power_law_1.2,0.23310720920562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,balanced,0.15959466497103372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.01,0.18495999574661254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.01,0.12635519504547119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,balanced,0.061648001273473106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,balanced,0.17975467443466187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.01,0.17137279510498046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.01,0.12588160037994384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,balanced,0.4047360022862752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,balanced,0.06299200157324474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.01,0.19283839464187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,2,128,power_law_1.2,0.37158401012420655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,balanced,0.19064533710479736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.01,0.1312831997871399
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,balanced,0.06444799900054932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.01,0.19074560403823854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,2,128,power_law_1.2,0.4642047882080078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.01,0.12378879785537719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.01,0.19468799829483033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,balanced,0.06594666838645935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,balanced,0.22035199403762817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.01,0.1300927996635437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,2,128,power_law_1.2,0.6357312202453613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.01,0.18249599933624266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,balanced,0.06685866912206014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,balanced,0.3646986484527588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.01,0.13103359937667847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,2,128,power_law_1.2,0.8881279945373535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.01,0.18328959941864015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,balanced,0.24594134092330933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,balanced,0.07251200079917908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.01,0.12053760290145873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.01,0.18980480432510377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,balanced,0.07330133517583211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.01,0.13494399785995484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,2,128,power_law_1.2,1.3442751884460449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.01,0.17360639572143555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.01,0.13879679441452025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,balanced,0.07715733349323273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,balanced,0.3983413378397624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.01,0.15942399501800536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,2,128,power_law_1.2,1.5755264282226562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.01,0.13292800188064574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.01,0.22064640522003173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,balanced,0.5194720029830933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.01,0.15838079452514647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,balanced,0.08527466654777527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.01,0.224070405960083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,2,128,power_law_1.2,2.198681640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.01,0.16879359483718873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.01,0.325382399559021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,balanced,0.43355735143025714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.01,0.20996479988098143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,2,128,power_law_1.2,3.2430145263671877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.01,0.34314239025115967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.01,0.26684160232543946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.01,0.4203199863433838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,2,128,power_law_1.2,7.090259552001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.01,0.3371968030929565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.01,0.5568575859069824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,balanced,0.093231995900472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.01,0.4362495899200439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.01,0.741971206665039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,balanced,0.6807573636372884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,balanced,0.10771200060844421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.01,0.6062399864196777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.01,0.9827136039733887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,balanced,0.6181600093841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.01,0.7883647918701172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.01,1.529203224182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,balanced,0.12058132886886597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,power_law_1.01,0.0588096022605896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.01,1.1077887535095214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.01,1.9071680068969727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,power_law_1.01,0.05459840297698974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.01,1.5814592361450195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.01,2.514841651916504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,power_law_1.01,0.048851200938224794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,power_law_1.01,0.05182719826698303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.01,1.8910335540771483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.01,3.6323902130126955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,4,64,power_law_1.2,0.19848959445953368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,power_law_1.01,0.05485439896583557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.01,2.8968448638916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,power_law_1.01,0.05504639744758606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,balanced,0.15195199847221375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,balanced,0.7995733420054117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,4,64,power_law_1.2,0.19631999731063843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,balanced,0.8368106683095297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.01,8.045804595947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,power_law_1.01,0.05911039710044861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,4,64,power_law_1.2,0.11705600023269654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,power_law_1.01,0.06235520243644714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.01,5.87138557434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,balanced,0.17764800786972046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,power_law_1.01,0.05950719714164734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,4,64,power_law_1.2,0.11994240283966065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,power_law_1.01,0.060812801122665405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,4,64,power_law_1.2,0.14244480133056642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,power_law_1.01,0.06585599780082703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,4,64,power_law_1.2,0.1710592031478882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,power_law_1.01,0.0661952018737793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,power_law_1.01,0.0688704013824463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,4,64,power_law_1.2,0.19866880178451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,power_law_1.01,0.0726207971572876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,4,64,power_law_1.2,0.1865407943725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,balanced,0.2379253307978312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,power_law_1.01,0.07834240198135375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,balanced,0.9868160088857015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,4,64,power_law_1.2,0.18380800485610962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,power_law_1.01,0.08082559704780579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,4,64,power_law_1.2,0.19489279985427857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,power_law_1.01,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,4,64,power_law_1.2,0.18152320384979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,balanced,0.29206933577855426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,power_law_1.01,0.11218559741973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,4,64,power_law_1.2,0.17757439613342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,4,64,power_law_1.2,0.18316160440444945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,balanced,1.3248746395111084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,4,64,power_law_1.2,0.17665280103683473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,4,64,power_law_1.2,0.18019839525222778
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,power_law_1.01,0.11964800357818603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,4,64,power_law_1.2,0.1756608009338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,power_law_1.01,0.14835840463638306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,4,64,power_law_1.2,0.22330880165100098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,power_law_1.01,0.1798784017562866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,4,64,power_law_1.2,0.26635520458221434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,4,64,power_law_1.2,0.28396799564361574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,4,64,power_law_1.2,0.336844801902771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,balanced,0.4200426737467448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,power_law_1.01,0.244051194190979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,4,64,power_law_1.2,0.38845438957214357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,power_law_1.01,0.31718399524688723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,balanced,1.5455786387125652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,4,64,power_law_1.2,0.5174464225769043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,power_law_1.01,0.4466559886932373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,4,64,power_law_1.2,0.6928832054138183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,4,64,power_law_1.2,1.231545639038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,power_law_1.01,0.6046720027923584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,4,64,power_law_1.2,1.3531776428222657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,power_law_1.01,0.844320011138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,4,64,power_law_1.2,2.3002431869506834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,balanced,0.5502773523330688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,power_law_1.01,1.0266431808471679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,4,64,power_law_1.2,2.571392059326172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,4,64,power_law_1.2,3.9306175231933596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,power_law_1.01,1.473804759979248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,4,64,power_law_1.2,5.939481735229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,power_law_1.01,2.3118976593017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,power_law_1.2,10.908108520507813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,power_law_1.01,4.824825668334961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,balanced,0.6960373719533285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,4,64,balanced,2.754847844441732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,balanced,3.1335681279500327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,balanced,1.0633227030436199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,4,64,power_law_1.2,0.12257280349731445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,4,64,power_law_1.2,0.12079360485076904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,4,64,power_law_1.2,0.07492480278015137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,4,64,power_law_1.2,0.08896639943122864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,4,64,power_law_1.2,0.09121919870376587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,4,64,power_law_1.2,0.10922240018844605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,4,64,power_law_1.2,0.1276800036430359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,4,64,power_law_1.2,0.12765439748764038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,4,64,power_law_1.2,0.12902400493621827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,4,64,power_law_1.2,0.12053120136260986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,4,64,power_law_1.2,0.058259201049804685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,4,64,power_law_1.2,0.12585599422454835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,balanced,2.1155360539754233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,balanced,0.056133334835370384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,4,64,power_law_1.2,0.1250175952911377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,4,64,power_law_1.2,0.12147200107574463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,4,64,power_law_1.2,0.05490559935569763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,balanced,0.05553600192070007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,4,64,power_law_1.2,0.10895999670028686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,balanced,0.055455997586250305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,4,64,power_law_1.2,0.04576640129089356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,4,64,power_law_1.2,0.1217087984085083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,balanced,0.057333335280418396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,4,64,power_law_1.2,0.052076798677444455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,balanced,0.06440000236034393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,4,64,power_law_1.2,0.13181439638137818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,4,64,power_law_1.2,0.05470719933509827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,balanced,0.07890133559703827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,4,64,power_law_1.2,0.05456640124320984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,4,64,power_law_1.2,0.135315203666687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,4,64,power_law_1.2,0.057708799839019775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,balanced,0.07939733564853668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,4,64,power_law_1.2,0.18451839685440063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,4,64,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,balanced,0.079434668024381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,4,64,power_law_1.2,0.18610559701919555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,4,64,power_law_1.2,0.05924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,balanced,0.0792799989382426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,4,64,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,4,64,power_law_1.2,0.24606080055236818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,balanced,0.08045866588751475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,4,64,power_law_1.2,0.06559360027313232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,4,64,power_law_1.2,0.2998143911361694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,balanced,0.0809386670589447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,4,64,power_law_1.2,0.06849920153617858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,balanced,0.08226133386294048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,4,64,power_law_1.2,0.3706943988800049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,4,64,power_law_1.2,0.0694208025932312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,balanced,0.08238400022188823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,4,64,power_law_1.2,0.07363839745521546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,4,64,power_law_1.2,0.5340864181518554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,4,64,power_law_1.2,0.08094720244407654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,balanced,0.08436800042788188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,4,64,power_law_1.2,0.7326015949249267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,4,64,power_law_1.2,0.08230400085449219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,balanced,0.08901333808898926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,4,64,power_law_1.2,0.10107519626617431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,4,64,power_law_1.2,0.9085184097290039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,balanced,0.08900800347328186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,4,64,power_law_1.2,1.3996352195739745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,balanced,0.09265066186587016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,4,64,power_law_1.2,0.11696000099182129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,balanced,0.10318400462468465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,4,64,power_law_1.2,1.837945556640625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,balanced,0.10703466335932414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,4,64,power_law_1.2,0.13502720594406128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,4,64,power_law_1.2,2.2794431686401366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,4,64,power_law_1.2,0.17411199808120728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,balanced,0.12081600228945415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,4,64,power_law_1.2,0.2269439935684204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,4,64,power_law_1.2,4.4492542266845705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,balanced,0.1327946682771047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,4,64,power_law_1.2,8.445017242431641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,4,64,power_law_1.2,0.3161855936050415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,balanced,0.15803733468055725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,4,64,power_law_1.2,0.47146239280700686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,4,64,power_law_1.2,0.5651072025299072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,balanced,0.18589866161346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,4,64,power_law_1.2,0.7513792037963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,4,64,power_law_1.2,1.1393728256225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,balanced,0.23541333278020224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,4,64,power_law_1.2,1.710393524169922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,balanced,0.04752000172932943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,balanced,0.048063998421033226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,4,64,power_law_1.2,2.212601661682129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,balanced,0.0480373352766037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,4,64,power_law_1.2,2.7053375244140625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,balanced,0.2929439942042033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,balanced,0.05420800050099691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,balanced,0.06302933394908905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,4,64,power_law_1.2,6.255750274658203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,balanced,0.06519466638565063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,balanced,0.06548800071080525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,balanced,0.06635733445485432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,balanced,0.04428799947102865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,balanced,0.06755200028419495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,balanced,0.04487466812133789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.01,0.09895679950714112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,balanced,0.0691786656777064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,balanced,0.4002506732940674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,balanced,0.04493333399295807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,balanced,0.06934933364391327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.01,0.07819520235061646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,balanced,0.04736533264319102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,balanced,0.07169599831104279
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.01,0.07070720195770264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,balanced,0.050554667909940086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,balanced,0.07387733459472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.01,0.07216640114784241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,balanced,0.062405332922935486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,balanced,0.06418133278687795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,balanced,0.07961600025494893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.01,0.06738560199737549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,balanced,0.06448000172773997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,balanced,0.07982933521270752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.01,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,balanced,0.06554666658242543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,balanced,0.08621333042780559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.01,0.06892799735069274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.01,0.07518720030784606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,balanced,0.06610666712125142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,balanced,0.5099786520004272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,balanced,0.0672159989674886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.01,0.07591040134429931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,balanced,0.09802666306495667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.01,0.06146559715270996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.01,0.07805439829826355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,balanced,0.06806399921576183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.01,0.05411199927330017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,balanced,0.10866666833559673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.01,0.07671679854393006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.01,0.055315202474594115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,balanced,0.06939200063546498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.01,0.07854080200195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,balanced,0.12942399581273398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.01,0.0565887987613678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,balanced,0.070783997575442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.01,0.07992960214614868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.01,0.08243200182914734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.01,0.05793280005455017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,balanced,0.0768693337837855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,balanced,0.14776532848676047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.01,0.08257279992103576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.01,0.061247998476028444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,balanced,0.07794666786988576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.01,0.09381759762763978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.01,0.06263039708137512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,balanced,0.18372799952824911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,balanced,0.08195200065771739
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,balanced,0.6223359902699789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.01,0.09833599925041199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.01,0.0644927978515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.01,0.12749439477920532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.01,0.06357120275497437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.01,0.13366400003433226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,balanced,0.22441067298253378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,balanced,0.09291733304659526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.01,0.0658240020275116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.01,0.1555199980735779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.01,0.0673919975757599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.01,0.17286399602890015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.01,0.22819840908050537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.01,0.07130240201950074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,balanced,0.30504000186920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.01,0.2666879892349243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.01,0.07459200024604798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.01,0.33777918815612795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.01,0.08353279829025269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,balanced,0.10216533144315083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.01,0.44206719398498534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.01,0.0867904007434845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.01,0.595078420639038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.01,0.09107840061187744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,balanced,0.11979732910792033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.01,0.7327807903289795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,balanced,0.3877813418706258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.01,0.10819200277328492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.01,0.964844799041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,balanced,0.13407466808954874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.01,0.12321280241012574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.01,1.5938176155090331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.01,0.15367679595947265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.01,0.17272959947586058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,balanced,0.9196853637695312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.01,3.2807231903076173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.01,0.22349441051483154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,balanced,0.5482720136642456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.01,0.272761607170105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,balanced,0.1726613243420919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.01,0.41775999069213865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.01,0.5216896057128906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.01,0.7202943801879883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,balanced,0.2042133410771688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.01,0.9840319633483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.01,1.1434304237365722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,balanced,0.7021439870198568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.01,1.7588607788085937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,power_law_1.01,0.06570240259170532
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,balanced,0.29390933116277057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.01,3.5711105346679686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,power_law_1.01,0.05914239883422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,power_law_1.01,0.047635200619697574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,power_law_1.01,0.05067520141601563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,balanced,0.37650132179260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,power_law_1.01,0.05614719986915588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,power_law_1.01,0.05854079723358154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,power_law_1.01,0.0617792010307312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,balanced,0.8878239790598551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,power_law_1.01,0.06345599889755249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,power_law_1.01,0.06298239827156067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,power_law_1.01,0.0648576021194458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,power_law_1.01,0.06803839802742004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,power_law_1.01,0.06982399821281433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,balanced,1.7988319396972656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,balanced,0.5381333430608114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,power_law_1.01,0.0716863989830017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,power_law_1.01,0.07775359749794006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,power_law_1.01,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,power_law_1.01,0.08906239867210389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,8,32,power_law_1.2,0.0982912003993988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,power_law_1.01,0.09631360173225403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,8,32,power_law_1.2,0.07825279831886292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,balanced,1.3363040288289387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,power_law_1.01,0.11188479661941528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,8,32,power_law_1.2,0.05824000239372253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,balanced,0.6981493631998698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,8,32,power_law_1.2,0.07256960272789001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,power_law_1.01,0.12476799488067628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,8,32,power_law_1.2,0.0664896011352539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,power_law_1.01,0.16362240314483642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,8,32,power_law_1.2,0.07287039756774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,power_law_1.01,0.18832000494003295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,8,32,power_law_1.2,0.074726402759552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,8,32,power_law_1.2,0.0744704008102417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,power_law_1.01,0.26357760429382326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,8,32,power_law_1.2,0.07511039972305297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,8,32,power_law_1.2,0.07745280265808105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,power_law_1.01,0.3911168098449707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,8,32,power_law_1.2,0.07932800054550171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,8,32,power_law_1.2,0.06732159852981567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,balanced,0.8739253679911295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,8,32,power_law_1.2,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,power_law_1.01,0.5208767890930176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,8,32,power_law_1.2,0.08321279883384705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,8,32,power_law_1.2,0.06032639741897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,power_law_1.01,0.6803520202636719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,8,32,power_law_1.2,0.08944000005722046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,8,32,power_law_1.2,0.05009920001029968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,8,32,power_law_1.2,0.09518719911575317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,8,32,power_law_1.2,0.05319679975509643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,8,32,power_law_1.2,0.09909759759902954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,power_law_1.01,1.0125056266784669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,8,32,power_law_1.2,0.05621119737625122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,8,32,power_law_1.2,0.10797439813613892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,8,32,power_law_1.2,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,power_law_1.01,1.2392000198364257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,8,32,power_law_1.2,0.13092479705810547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,8,32,power_law_1.2,0.06042879819869995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,8,32,power_law_1.2,0.13935999870300292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,8,32,power_law_1.2,0.18731520175933838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,8,32,power_law_1.2,0.06287999749183655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,power_law_1.01,1.5772543907165528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,8,32,power_law_1.2,0.18214399814605714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,8,32,power_law_1.2,0.06324480175971985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,8,32,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,power_law_1.01,2.625049591064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,8,32,power_law_1.2,0.06334720253944397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,8,32,power_law_1.2,0.3096640110015869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,8,32,power_law_1.2,0.06694399714469909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,8,32,power_law_1.2,0.4907199859619141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,power_law_1.01,5.318438339233398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,8,32,power_law_1.2,0.07134079933166504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,8,32,power_law_1.2,0.5069119930267334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,balanced,2.64355198542277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,balanced,1.3445812861124675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,8,32,power_law_1.2,0.79169921875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,8,32,power_law_1.2,0.07051519751548767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,8,32,power_law_1.2,0.8864895820617675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,8,32,power_law_1.2,0.07561600208282471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,8,32,power_law_1.2,0.08343679904937744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,8,32,power_law_1.2,1.189247989654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,8,32,power_law_1.2,0.0923583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,8,32,power_law_1.2,2.00445442199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,8,32,power_law_1.2,0.09254400134086609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,8,32,power_law_1.2,0.1168895959854126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,8,32,power_law_1.2,4.5550079345703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,8,32,power_law_1.2,0.12736639976501465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,8,32,power_law_1.2,0.1745792031288147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,8,32,power_law_1.2,0.19069440364837648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,8,32,power_law_1.2,0.24535679817199707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,8,32,power_law_1.2,0.2964224100112915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,8,32,power_law_1.2,0.4597184181213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,8,32,power_law_1.2,0.5398975849151612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,8,32,power_law_1.2,0.8400639533996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,8,32,power_law_1.2,1.1419967651367187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,8,32,power_law_1.2,1.4629823684692382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,8,32,power_law_1.2,2.3150720596313477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,8,32,power_law_1.2,0.06568959951400757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,8,32,power_law_1.2,4.654079818725586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,8,32,power_law_1.2,0.05932160019874573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,8,32,power_law_1.2,0.04539520144462585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,8,32,power_law_1.2,0.05296639800071716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,8,32,power_law_1.2,0.05544319748878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,8,32,power_law_1.2,0.060096001625061034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,8,32,power_law_1.2,0.06097919940948486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,balanced,2.670917193094889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,8,32,power_law_1.2,0.06231039762496948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,8,32,power_law_1.2,0.0643775999546051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,8,32,power_law_1.2,0.0652351975440979
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,balanced,0.05425600210825602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,8,32,power_law_1.2,0.06640639901161194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,balanced,0.0554613322019577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,8,32,power_law_1.2,0.07171840071678162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,balanced,0.05537599821885427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,8,32,power_law_1.2,0.07386239767074584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,balanced,0.059301331639289856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,8,32,power_law_1.2,0.0796992003917694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,balanced,0.06677866478761037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,8,32,power_law_1.2,0.08671360015869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,balanced,0.07747200131416321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,8,32,power_law_1.2,0.0890496015548706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,balanced,0.07916266719500224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,8,32,power_law_1.2,0.10579839944839478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,balanced,0.08029333253701527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,8,32,power_law_1.2,0.12102400064468384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,balanced,0.0803413341442744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,balanced,0.08082666496435802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,balanced,0.08179200192292531
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,8,32,power_law_1.2,0.14200960397720336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,balanced,0.08367466926574707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,8,32,power_law_1.2,0.1796223998069763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,balanced,0.08385599652926128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,8,32,power_law_1.2,0.21898241043090821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,balanced,0.086325337489446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,balanced,0.047338664531707764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,balanced,0.09079999725023906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,balanced,0.04804799954096476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,balanced,0.0913813312848409
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,8,32,power_law_1.2,0.3230079889297485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,balanced,0.04885333279768626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,balanced,0.09612799684206645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,8,32,power_law_1.2,0.43029122352600097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,balanced,0.05232533315817515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,balanced,0.10657599568367004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,balanced,0.056405335664749146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,8,32,power_law_1.2,0.6359744071960449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,balanced,0.11594667037328084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,balanced,0.06709866722424825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,balanced,0.06850666801134746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,8,32,power_law_1.2,0.770911979675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,balanced,0.13532800475756326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,balanced,0.06947733461856842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,balanced,0.06975466509660085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,balanced,0.15007999539375305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,8,32,power_law_1.2,1.128985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,balanced,0.07109866539637248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,balanced,0.07202666501204173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,8,32,power_law_1.2,1.9974592208862305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,balanced,0.07302933434645335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,balanced,0.18673600753148398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,balanced,0.07499733567237854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,8,32,power_law_1.2,1.9971839904785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,balanced,0.07627733548482259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,8,32,power_law_1.2,3.6856063842773437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,balanced,0.08236266672611237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,balanced,0.21663999557495117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,balanced,0.08418132861455281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,8,32,power_law_1.2,9.214591979980469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,balanced,0.09119466940561931
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,balanced,0.10398399829864502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,balanced,0.2847573359807332
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,balanced,0.11669333775838216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,balanced,0.13883733749389648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,balanced,0.3551573355992635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,balanced,0.160480002562205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,balanced,0.20352532466252646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,balanced,0.25255467494328815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,balanced,0.497381329536438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,balanced,0.3474773168563843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.01,0.06833279728889466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,balanced,0.44447465737660724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.01,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,balanced,0.6222560008366903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.01,0.06442880034446716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.01,0.06481279730796814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,balanced,0.04548799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.01,0.07778559923171997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,balanced,0.045935998360315956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.01,0.0536191999912262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.01,0.06974719762802124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,balanced,0.0470773329337438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,balanced,0.050794666012128196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,balanced,0.6344693501790365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.01,0.07383679747581481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.01,0.0657472014427185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,balanced,0.05584000051021576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,balanced,0.06727999945481618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.01,0.07455360293388366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.01,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,balanced,0.07010666529337566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,balanced,0.07036800185839336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.01,0.07600640058517456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.01,0.05382400155067444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,balanced,0.07094933092594147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,balanced,0.7710399627685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.01,0.07804160118103028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,balanced,0.07186666627724965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.01,0.056806397438049314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,balanced,0.0734986662864685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.01,0.07916799783706666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.01,0.06064640283584595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,balanced,0.07489599784215291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,balanced,0.07627733548482259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.01,0.06542080044746398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.01,0.08069760203361512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,balanced,0.07815999786059062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,balanced,0.8057653109232584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.01,0.066348797082901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.01,0.08247680068016053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,balanced,0.08543999989827473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,balanced,0.08711999654769897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.01,0.06631039977073669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.01,0.08654080033302307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,balanced,0.092357337474823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.01,0.09121919870376587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.01,0.0705024003982544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.01,0.10043519735336304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,balanced,0.10569066802660625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.01,0.07155200242996215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.01,0.10353920459747315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.01,0.07459200024604798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.01,0.12283519506454468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.01,0.07882239818572997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.01,0.13034240007400513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.01,0.09095680117607116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.01,0.1561535954475403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,balanced,0.12221333384513855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.01,0.09077759981155395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,balanced,1.0070079962412517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.01,0.09694079756736755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.01,0.18330880403518676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,balanced,0.1465173363685608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,balanced,1.1724106470743816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.01,0.11204479932785034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.01,0.24036478996276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,power_law_1.01,0.05860480070114136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,balanced,0.16460266709327698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.01,0.12714879512786864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,power_law_1.01,0.06903039813041686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.01,0.2878592014312744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.01,0.16368000507354735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,power_law_1.01,0.05018879771232605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,16,16,power_law_1.2,0.07087360024452209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.01,0.17630079984664918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,power_law_1.01,0.05172479748725891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.01,0.3709439992904663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.01,0.2486720085144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,16,16,power_law_1.2,0.08182399868965148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,power_law_1.01,0.05923839807510376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,balanced,0.2299306591351827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.01,0.30770559310913087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,16,16,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,power_law_1.01,0.06272640228271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.01,0.4302080154418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.01,0.4610559940338135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,16,16,power_law_1.2,0.06485120058059693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,power_law_1.01,0.07025279998779296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.01,0.5195072174072266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,balanced,0.28649065891901654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,16,16,power_law_1.2,0.0735871970653534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,power_law_1.01,0.07159039974212647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.01,0.6787839889526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,16,16,power_law_1.2,0.06821119785308838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.01,0.7902527809143066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,power_law_1.01,0.06909440159797668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,16,16,power_law_1.2,0.07374079823493958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.01,0.9252863883972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.01,1.037484836578369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,power_law_1.01,0.0746944010257721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,16,16,power_law_1.2,0.0769919991493225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,16,16,power_law_1.2,0.07702400088310242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,power_law_1.01,0.07863680124282837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.01,1.129958438873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.01,1.2632255554199219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,balanced,1.5608800252278645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,16,16,power_law_1.2,0.0772607982158661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,power_law_1.01,0.0814848005771637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,balanced,0.4179999828338623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.01,1.639232063293457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.01,1.9451583862304687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,16,16,power_law_1.2,0.07841920256614685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,power_law_1.01,0.0841152012348175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,16,16,power_law_1.2,0.08257279992103576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,power_law_1.01,0.09354239702224731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,16,16,power_law_1.2,0.08309119939804077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.01,3.866521453857422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,power_law_1.01,0.10374399423599243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.01,4.067769622802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,16,16,power_law_1.2,0.08834559917449951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,power_law_1.01,0.10823040008544922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,16,16,power_law_1.2,0.09470720291137695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,balanced,0.5216480096181234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,16,16,power_law_1.2,0.10088959932327271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,power_law_1.01,0.13127679824829103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,16,16,power_law_1.2,0.10819200277328492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,16,16,power_law_1.2,0.12466559410095215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,power_law_1.01,0.15311360359191895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,16,16,power_law_1.2,0.14052480459213257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,power_law_1.01,0.19648000001907348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,16,16,power_law_1.2,0.15896320343017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,balanced,0.7494133313496908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,power_law_1.01,0.25427200794219973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,16,16,power_law_1.2,0.2068608045578003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,16,16,power_law_1.2,0.24702720642089843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,power_law_1.01,0.33219199180603026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,balanced,2.2515786488850913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,16,16,power_law_1.2,0.31875200271606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,power_law_1.01,0.43094401359558104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,16,16,power_law_1.2,0.4401984214782715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,power_law_1.01,0.629318380355835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,balanced,0.9734880129496256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,power_law_1.01,0.8100480079650879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,16,16,power_law_1.2,0.576032018661499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,power_law_1.01,1.2299455642700194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,16,16,power_law_1.2,0.8002559661865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,power_law_1.01,1.407852840423584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,16,16,power_law_1.2,0.05381760001182556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,16,16,power_law_1.2,1.040550422668457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,16,16,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,16,16,power_law_1.2,1.3305536270141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,power_law_1.01,1.9723455429077148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,16,16,power_law_1.2,0.049856001138687135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,16,16,power_law_1.2,2.049305534362793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,power_law_1.01,2.905504035949707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,16,16,power_law_1.2,0.05541120171546936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,16,16,power_law_1.2,0.057785600423812866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,balanced,3.0607519149780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,power_law_1.01,6.406227111816406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,16,16,power_law_1.2,4.756985473632812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,balanced,1.2167359987894695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,16,16,power_law_1.2,0.05989760160446167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,16,16,power_law_1.2,0.06424319744110107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,16,16,power_law_1.2,0.06588799953460693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,16,16,power_law_1.2,0.06492800116539002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,16,16,power_law_1.2,0.06690559983253479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,16,16,power_law_1.2,0.06940799951553345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,16,16,power_law_1.2,0.07372159957885742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,16,16,power_law_1.2,0.0745855987071991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,16,16,power_law_1.2,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,16,16,power_law_1.2,0.09041280150413514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,balanced,1.8933067321777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,16,16,power_law_1.2,0.09438719749450683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,16,16,power_law_1.2,0.10016000270843506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,16,16,power_law_1.2,0.1185215950012207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,16,16,power_law_1.2,0.13317760229110717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,16,16,power_law_1.2,0.17354240417480468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,16,16,power_law_1.2,0.19224319458007813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,16,16,power_law_1.2,0.26462080478668215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,16,16,power_law_1.2,0.30433919429779055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,16,16,power_law_1.2,0.4969088077545166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,16,16,power_law_1.2,0.70414719581604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,16,16,power_law_1.2,0.8884160041809082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,16,16,power_law_1.2,1.1968959808349608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,16,16,power_law_1.2,1.4878080368041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,16,16,power_law_1.2,2.407583999633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,16,16,power_law_1.2,5.322092819213867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,balanced,3.7636000315348306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,balanced,0.05537599821885427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,256,16,16,power_law_1.2,0.05882880091667175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,balanced,0.05436799923578898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,balanced,0.05615466833114624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,256,16,16,power_law_1.2,0.06467199921607972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,balanced,0.05991466840108236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,256,16,16,power_law_1.2,0.04893440008163452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,balanced,0.04822400212287903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,balanced,0.08415466547012329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,256,16,16,power_law_1.2,0.054611200094223024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,balanced,0.04860266546408335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,balanced,0.09539199868837993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,256,16,16,power_law_1.2,0.057894402742385866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,balanced,0.05049066742261251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,balanced,0.0958186686038971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,balanced,0.055344000458717346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,balanced,0.09774933258692424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,256,16,16,power_law_1.2,0.06270080208778381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,balanced,0.06374399860699971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,balanced,0.09723200400670369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,256,16,16,power_law_1.2,0.06557440161705017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,balanced,0.08598933617273967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,balanced,0.09860799709955852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,256,16,16,power_law_1.2,0.06871680021286011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,balanced,0.08646933237711589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,balanced,0.09453333417574565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,256,16,16,power_law_1.2,0.07011839747428894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,balanced,0.08134399851163228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,balanced,0.09735467036565144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,balanced,0.08073066671689351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,256,16,16,power_law_1.2,0.0699072003364563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,balanced,0.09685867031415303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,balanced,0.08306666711966197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,256,16,16,power_law_1.2,0.07345280051231384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,balanced,0.10155199964841206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,balanced,0.08246933420499165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,256,16,16,power_law_1.2,0.07955200076103211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,balanced,0.10632000366846721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,balanced,0.08374399940172832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,balanced,0.08695466319719951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,256,16,16,power_law_1.2,0.08309760093688964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,balanced,0.10385599732398987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,balanced,0.08868267138799031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,balanced,0.11485866705576579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,256,16,16,power_law_1.2,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,balanced,0.09650666515032451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,balanced,0.12169067064921062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,256,16,16,power_law_1.2,0.10144000053405762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,balanced,0.09778666496276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,balanced,0.13404267032941183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,balanced,0.1065120001633962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,256,16,16,power_law_1.2,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,balanced,0.11876799662907918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,256,16,16,power_law_1.2,0.11537920236587525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,balanced,0.15635733803113303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.01,0.06399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.01,0.05433599948883057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,balanced,0.13483200470606485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,balanced,0.1781546672185262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.01,0.05571200251579285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.01,0.063155198097229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,256,16,16,power_law_1.2,0.13727999925613404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,balanced,0.15872533122698465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.01,0.050918400287628174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.01,0.058220797777175905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,balanced,0.22712000211079916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.01,0.057030397653579715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,balanced,0.18525334199269614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.01,0.06539520025253295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,256,16,16,power_law_1.2,0.1644544005393982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.01,0.06546559929847717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.01,0.0759872019290924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.01,0.06694399714469909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,256,16,16,power_law_1.2,0.22168960571289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,balanced,0.27776533365249634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,balanced,0.24736533562342325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.01,0.07344639897346497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.01,0.07484800219535828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.01,0.08932480216026306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,256,16,16,power_law_1.2,0.28596479892730714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.01,0.07608320116996765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.01,0.08775039911270141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.01,0.07527040243148804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,balanced,0.31067200501759845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.01,0.07975040078163147
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.01,0.08913919925689698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,256,16,16,power_law_1.2,0.4242239952087402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,balanced,0.3794879913330078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.01,0.08321279883384705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.01,0.0908735990524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,256,16,16,power_law_1.2,0.5403903961181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.01,0.08353279829025269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.01,0.09875839948654175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.01,0.08861439824104309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,balanced,0.43592532475789386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.01,0.09512959718704224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.01,0.09875199794769288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,256,16,16,power_law_1.2,0.7758592128753662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.01,0.10680320262908935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.01,0.10139520168304443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,balanced,0.488810658454895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,256,16,16,power_law_1.2,1.0757504463195802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.01,0.1124735951423645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.01,0.10251519680023194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.01,0.10979199409484863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,256,16,16,power_law_1.2,1.4990592002868652
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.01,0.11713279485702514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.01,0.129312002658844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,balanced,0.5677280028661092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.01,0.1427135944366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.01,0.12355200052261353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,256,16,16,power_law_1.2,2.106719970703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.01,0.18387839794158936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.01,0.11521919965744018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.01,0.21431679725646974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.01,0.13267199993133544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,256,16,16,power_law_1.2,2.3085567474365236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.01,0.28643839359283446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,balanced,0.7096426486968994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.01,0.1431488037109375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.01,0.3561216115951538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.01,0.4942272186279297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.01,0.17642879486083984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,256,16,16,power_law_1.2,4.786329650878907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.01,0.6539135932922363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.01,0.19802240133285523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,balanced,0.8227466742197672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.01,0.9376640319824219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.01,0.26698880195617675
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,256,16,16,power_law_1.2,9.005522918701171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.01,1.2512127876281738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.01,0.3295167922973633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.01,1.5377984046936035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.01,0.484876823425293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.01,2.48799991607666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,balanced,0.8541333675384521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.01,0.6151936054229736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.01,4.928422546386718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.01,0.8718655586242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,balanced,1.021008014678955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.01,1.2426815986633302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.01,1.3741439819335937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.01,2.3945024490356444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,256,32,8,power_law_1.2,0.06270719766616821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.01,4.393484878540039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,balanced,1.0858559608459473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,256,32,8,power_law_1.2,0.0630079984664917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,256,32,8,power_law_1.2,0.05605120062828064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,256,32,8,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,256,32,8,power_law_1.2,0.0720255970954895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,balanced,1.2874080340067546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,256,32,8,power_law_1.2,0.08120319843292237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,256,32,8,power_law_1.2,0.08629119992256165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,256,32,8,power_law_1.2,0.08689919710159302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,256,32,8,power_law_1.2,0.08878080248832702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,256,32,8,power_law_1.2,0.09006720185279846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,256,32,8,power_law_1.2,0.09845759868621826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,256,32,8,power_law_1.2,0.10206079483032227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,256,32,8,power_law_1.2,0.10207359790802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,256,32,8,power_law_1.2,0.10931839942932128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,256,32,8,power_law_1.2,0.11592960357666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,256,32,8,power_law_1.2,0.12508800029754638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,256,32,8,power_law_1.2,0.12020479440689087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,balanced,1.6120212872823079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,256,32,8,power_law_1.2,0.13659520149230958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,256,32,8,power_law_1.2,0.15112320184707642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,256,32,8,power_law_1.2,0.20961918830871581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,256,32,8,power_law_1.2,0.2311232089996338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,balanced,1.9859894116719563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,256,32,8,power_law_1.2,0.3081984043121338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,256,32,8,power_law_1.2,0.39483520984649656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,256,32,8,power_law_1.2,0.508460807800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,256,32,8,power_law_1.2,0.6630080223083497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,256,32,8,power_law_1.2,1.0362943649291991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,256,32,8,power_law_1.2,1.2896960258483887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,256,32,8,power_law_1.2,1.77457275390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,256,32,8,power_law_1.2,2.618956756591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,power_law_1.2,5.545708847045899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,256,32,8,balanced,3.152682622273763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,balanced,3.962656021118164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,256,32,8,power_law_1.2,0.05438719987869263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,256,32,8,power_law_1.2,0.05568000078201294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,balanced,0.03492266684770584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,256,32,8,power_law_1.2,0.04997760057449341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,balanced,0.03535466641187668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,balanced,0.03681600093841553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,256,32,8,power_law_1.2,0.05697280168533325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,balanced,0.03685333331425985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,256,32,8,power_law_1.2,0.06487680077552796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,balanced,0.038032000263532005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,balanced,0.037392000357309975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,256,32,8,power_law_1.2,0.06471040248870849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,balanced,0.0388373335202535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,balanced,0.032069332897663116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,256,32,8,power_law_1.2,0.07561600208282471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,balanced,0.03669866671164831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,balanced,0.03988266736268997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,balanced,0.031141333281993866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,256,32,8,power_law_1.2,0.07464960217475891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,balanced,0.04214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,balanced,0.03183466692765554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,balanced,0.037978666524092354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,256,32,8,power_law_1.2,0.0775488018989563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,balanced,0.03730666637420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,256,32,8,power_law_1.2,0.07923840284347534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,balanced,0.03365866591533025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,balanced,0.03873066604137421
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,256,32,8,power_law_1.2,0.08195840120315552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,balanced,0.03495999922355016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,balanced,0.04029333343108495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,balanced,0.03810133288304011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,256,32,8,power_law_1.2,0.08488960266113281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,balanced,0.0443200021982193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,balanced,0.037765334049860634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,256,32,8,power_law_1.2,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,balanced,0.0402399996916453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,balanced,0.035301332672437034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,256,32,8,power_law_1.2,0.09642879962921143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,balanced,0.04165866722663244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,balanced,0.036133334040641785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,256,32,8,power_law_1.2,0.11121920347213746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,balanced,0.03752533346414566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,balanced,0.04340266684691111
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,256,32,8,power_law_1.2,0.11511679887771606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,balanced,0.03632533301909765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,256,32,8,power_law_1.2,0.11227519512176513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,balanced,0.04299733539422353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,balanced,0.03749866783618927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,256,32,8,power_law_1.2,0.1337280035018921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,balanced,0.043338666359583534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,balanced,0.04022400081157684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,256,32,8,power_law_1.2,0.1445631980895996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,balanced,0.041663999358812966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,256,32,8,power_law_1.2,0.18929920196533204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,balanced,0.0524533341328303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,256,32,8,power_law_1.2,0.21442561149597167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,balanced,0.04277333120505015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,256,32,8,power_law_1.2,0.3007999897003174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,balanced,0.05414933462937673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,256,32,8,power_law_1.2,0.40096001625061034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,balanced,0.04320000112056732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,256,32,8,power_law_1.2,0.5220352172851562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,balanced,0.04660800099372864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,balanced,0.06946666538715363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,256,32,8,power_law_1.2,0.7775872230529786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,balanced,0.04937066634496053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,256,32,8,power_law_1.2,1.093932819366455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,256,32,8,power_law_1.2,1.3390527725219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,balanced,0.06563733518123627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,balanced,0.023685333629449207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,balanced,0.07989866534868877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,256,32,8,power_law_1.2,1.7585535049438477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,balanced,0.023370665808518726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,balanced,0.023525332411130268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,256,32,8,power_law_1.2,2.7315647125244142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,balanced,0.025285333395004272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,balanced,0.07560533285140991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,balanced,0.025173333783944447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,balanced,0.026565333207448322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,256,32,8,power_law_1.2,5.963020706176758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,balanced,0.027061333258946735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,power_law_1.01,0.032467201352119446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,balanced,0.02683199942111969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,balanced,0.09726400176684062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,balanced,0.10502400000890096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,balanced,0.02703999976317088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,power_law_1.01,0.032102400064468385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,balanced,0.02735999971628189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,power_law_1.01,0.03253760039806366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,balanced,0.027637332677841187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,balanced,0.027866666515668232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,power_law_1.01,0.034143999218940735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,balanced,0.02870933214823405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,power_law_1.01,0.03456639945507049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,balanced,0.11590400338172913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,balanced,0.029088000456492107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,power_law_1.01,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,balanced,0.03150933235883713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,power_law_1.01,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,balanced,0.03084266682465871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,balanced,0.12448533376057942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,power_law_1.01,0.035846400260925296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,power_law_1.01,0.0315200001001358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,power_law_1.01,0.03608959913253784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,power_law_1.01,0.03116160035133362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,power_law_1.01,0.03857919871807099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,power_law_1.01,0.031174400448799135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,balanced,0.15500799814860025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,power_law_1.01,0.03580799996852875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,balanced,0.03201599915822347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,power_law_1.01,0.03319680094718933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,power_law_1.01,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,power_law_1.01,0.03839359879493713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,power_law_1.01,0.03353599905967712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,balanced,0.03268266717592875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,power_law_1.01,0.035743999481201175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,power_law_1.01,0.037241598963737486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,power_law_1.01,0.03635840117931366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,power_law_1.01,0.04042240083217621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,balanced,0.14945066968599954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,power_law_1.01,0.03644160032272339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,power_law_1.01,0.04126079976558685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,balanced,0.1901493271191915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,power_law_1.01,0.022412799298763275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,power_law_1.01,0.03424000144004822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,power_law_1.01,0.04746879935264588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,power_law_1.01,0.036652800440788266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,power_law_1.01,0.05382400155067444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,power_law_1.01,0.022278399765491487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,balanced,0.03766400118668874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,power_law_1.01,0.0595583975315094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,power_law_1.01,0.02234880030155182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,power_law_1.01,0.0355648010969162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,power_law_1.01,0.02426239997148514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,power_law_1.01,0.07215999960899352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,power_law_1.01,0.03548159897327423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,power_law_1.01,0.024748800694942473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,power_law_1.01,0.09351680278778077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,power_law_1.01,0.036748799681663516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,power_law_1.01,0.025772801041603087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,power_law_1.01,0.12461440563201905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,balanced,0.04321600000063578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,power_law_1.01,0.036134400963783266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,power_law_1.01,0.025779199600219727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,power_law_1.01,0.17025920152664184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,power_law_1.01,0.0380160003900528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,power_law_1.01,0.025753599405288697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,power_law_1.01,0.22201600074768066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,balanced,0.04713066418965658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,power_law_1.01,0.025798401236534117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,balanced,0.2305333415667216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,power_law_1.01,0.04056319892406464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,power_law_1.01,0.3154239892959595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,power_law_1.01,0.026105600595474242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,power_law_1.01,0.041119998693466185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,power_law_1.01,0.42442879676818845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,power_law_1.01,0.026790401339530943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,power_law_1.01,0.04776319861412048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,balanced,0.2196213404337565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,power_law_1.01,0.5200448036193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,power_law_1.01,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,power_law_1.01,0.04986239969730377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,power_law_1.01,0.8625087738037109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,power_law_1.01,0.027616000175476073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,power_law_1.01,0.05891839861869812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,power_law_1.01,0.028595200181007384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,power_law_1.01,1.9654592514038085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,balanced,0.0598880002895991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,power_law_1.01,0.06972799897193908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,power_law_1.01,0.03107840120792389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,power_law_1.01,0.09349759817123413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,power_law_1.01,0.03240959942340851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,power_law_1.01,0.12017279863357544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,power_law_1.01,0.16974079608917236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,power_law_1.01,0.03857280015945434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,power_law_1.01,0.21155838966369628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,power_law_1.01,0.042368000745773314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,balanced,0.07044800122578938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,power_law_1.01,0.049881601333618165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,power_law_1.01,0.32592000961303713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,balanced,0.34463465213775635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,power_law_1.01,0.39819519519805907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,power_law_1.01,0.05621119737625122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,power_law_1.01,0.5388607978820801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,power_law_1.01,0.07043200135231018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,power_law_1.01,0.8816960334777832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,power_law_1.01,0.08533759713172913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,power_law_1.01,1.6285055160522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,power_law_1.01,0.11064319610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,balanced,0.09249599774678548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,power_law_1.01,0.13829760551452636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,power_law_1.01,0.19116159677505493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,2,128,power_law_1.2,0.03603839874267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,balanced,0.4077226718266805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,power_law_1.01,0.26231040954589846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,2,128,power_law_1.2,0.03603839874267578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,2,128,power_law_1.2,0.03746559917926788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,balanced,0.11244266231854756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,power_law_1.01,0.3556288003921509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,2,128,power_law_1.2,0.03832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,2,128,power_law_1.2,0.037811198830604555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,2,128,power_law_1.2,0.04017280042171478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,power_law_1.01,0.4288959980010986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,2,128,power_law_1.2,0.038848000764846805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,power_law_1.01,0.7538623809814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,2,128,power_law_1.2,0.03937920033931732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,balanced,0.6512800057729086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,power_law_1.01,1.3605312347412108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,2,128,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,2,128,power_law_1.2,0.036313599348068236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,balanced,0.13461866974830627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,2,128,power_law_1.2,0.0357120007276535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,2,128,power_law_1.2,0.03664000034332275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,2,128,power_law_1.2,0.03537920117378235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,2,128,power_law_1.2,0.03609600067138672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,2,128,power_law_1.2,0.04267520010471344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,2,128,power_law_1.2,0.031564798951148984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,2,128,power_law_1.2,0.042956799268722534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,2,128,power_law_1.2,0.031839999556541446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,2,128,power_law_1.2,0.04573439955711365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,2,128,power_law_1.2,0.03113600015640259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,2,128,power_law_1.2,0.05368319749832153
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,2,128,power_law_1.2,0.03345920145511627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,2,128,power_law_1.2,0.06398079991340637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,2,128,power_law_1.2,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,2,128,power_law_1.2,0.07683200240135193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,2,128,power_law_1.2,0.03464959859848023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,2,128,power_law_1.2,0.09810559749603272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,2,128,power_law_1.2,0.036800000071525577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,2,128,power_law_1.2,0.13521280288696289
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,2,128,power_law_1.2,0.16755839586257934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,2,128,power_law_1.2,0.03664000034332275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,balanced,0.19839467604955038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,2,128,power_law_1.2,0.23623039722442626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,2,128,power_law_1.2,0.034720000624656674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,2,128,power_law_1.2,0.3352576017379761
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,2,128,power_law_1.2,0.036556801199913024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,2,128,power_law_1.2,0.48239359855651853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,2,128,power_law_1.2,0.035699200630187986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,2,128,power_law_1.2,0.640883207321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,2,128,power_law_1.2,0.03592959940433502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,2,128,power_law_1.2,0.8033727645874024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,2,128,power_law_1.2,0.036134400963783266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,2,128,power_law_1.2,1.364083194732666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,2,128,power_law_1.2,0.03646079897880554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,2,128,power_law_1.2,0.04115839898586273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,2,128,power_law_1.2,2.913222312927246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,2,128,power_law_1.2,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,2,128,power_law_1.2,0.04297600090503693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,2,128,power_law_1.2,0.0494592010974884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,2,128,power_law_1.2,0.05621119737625122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,2,128,power_law_1.2,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,2,128,power_law_1.2,0.08883839845657349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,2,128,power_law_1.2,0.12262400388717651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,2,128,power_law_1.2,0.1430848002433777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,2,128,power_law_1.2,0.22695679664611818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,2,128,power_law_1.2,0.30065920352935793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,2,128,power_law_1.2,0.41900157928466797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,2,128,power_law_1.2,0.5661056041717529
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,2,128,power_law_1.2,0.7216447830200196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,2,128,power_law_1.2,1.1346879959106446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,balanced,0.3696853319803874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,2,128,power_law_1.2,2.2246976852416993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,2,128,power_law_1.2,0.02221439927816391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,2,128,power_law_1.2,0.022227199375629426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,balanced,0.02216000109910965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,2,128,power_law_1.2,0.02220800071954727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,2,128,power_law_1.2,0.0243136003613472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,2,128,power_law_1.2,0.02462719976902008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,balanced,0.023754666248957317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,2,128,power_law_1.2,0.02566399872303009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,2,128,power_law_1.2,0.025862398743629455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,balanced,0.021914665897687275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,2,128,power_law_1.2,0.025939199328422546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,2,128,power_law_1.2,0.026035198569297792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,balanced,0.023029332359631855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,2,128,power_law_1.2,0.026502400636672974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,balanced,0.023951999843120575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,2,128,power_law_1.2,0.026848000288009644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,balanced,0.030074665943781536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,2,128,power_law_1.2,0.027590399980545043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,balanced,0.02874133239189784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,balanced,0.02514133354028066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,2,128,power_law_1.2,0.02815360128879547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,balanced,0.02882666637500127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,balanced,0.024773334463437397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,2,128,power_law_1.2,0.0301503986120224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,balanced,0.03155199935038885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,balanced,0.024901332954565685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,balanced,0.03170666595300039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,2,128,power_law_1.2,0.03310079872608185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,balanced,0.025759999950726826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,balanced,0.033786666889985405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,2,128,power_law_1.2,0.03420799970626831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,balanced,0.02531733363866806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,balanced,0.03349333256483078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,balanced,0.025802666942278545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,balanced,0.033039999504884086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,2,128,power_law_1.2,0.041529598832130435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,balanced,0.03335466732581457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,balanced,0.02595199892918269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,balanced,0.03372266640265783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,2,128,power_law_1.2,0.05278720259666443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,balanced,0.03428266694148382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,2,128,power_law_1.2,0.06267520189285278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,balanced,0.026416001220544178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,balanced,0.03454400102297465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,balanced,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,balanced,0.035605333745479584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,balanced,0.035562666753927864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,2,128,power_law_1.2,0.06888319849967957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,balanced,0.03499199946721395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,balanced,0.038693333665529885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,2,128,power_law_1.2,0.09288319945335388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,balanced,0.03513599932193756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,balanced,0.03818666686614355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,balanced,0.03584533433119456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,2,128,power_law_1.2,0.1268224000930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,balanced,0.03946666667858759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,power_law_1.01,0.021990400552749634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,2,128,power_law_1.2,0.1661120057106018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,balanced,0.037402667105197906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,power_law_1.01,0.02335360050201416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,balanced,0.040005333721637726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,balanced,0.03855466594298681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,power_law_1.01,0.021663999557495116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,balanced,0.04084266722202301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,2,128,power_law_1.2,0.19482239484786987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,power_law_1.01,0.023366400599479677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,balanced,0.04067199925581614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,balanced,0.0444213350613912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,power_law_1.01,0.023571200668811798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,2,128,power_law_1.2,0.2972223997116089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,balanced,0.022645334402720135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,balanced,0.041834667325019836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,power_law_1.01,0.02444159984588623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,balanced,0.04683200021584829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,balanced,0.022490667800108593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,power_law_1.01,0.024691200256347655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,balanced,0.022570667167504627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,power_law_1.01,0.024908800423145295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,2,128,power_law_1.2,0.41611518859863283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,balanced,0.059674665331840515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,balanced,0.02483733246723811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,power_law_1.01,0.02863360047340393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,balanced,0.024469333390394848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,2,128,power_law_1.2,0.5420544147491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,power_law_1.01,0.02996479868888855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,balanced,0.06984533369541168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,balanced,0.025978667040665943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,balanced,0.048170665899912514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,power_law_1.01,0.03111039996147156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,balanced,0.02644266684850057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,balanced,0.026261332134405773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,power_law_1.01,0.03141759932041168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,2,128,power_law_1.2,0.6510591983795166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,balanced,0.026074667771657307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,balanced,0.026901334524154663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,balanced,0.0885599950949351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,2,128,power_law_1.2,1.0481344223022462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,balanced,0.061199997862180076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,balanced,0.027349332968393963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,power_law_1.01,0.03386240005493164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,balanced,0.027493332823117573
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,2,128,power_law_1.2,2.0632768630981446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,power_law_1.01,0.03676159977912903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,balanced,0.02826133370399475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,power_law_1.01,0.037939199805259706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,balanced,0.028533334533373516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,balanced,0.10300800204277039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,balanced,0.031040000418821972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,power_law_1.01,0.038150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,balanced,0.06379200021425883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,power_law_1.01,0.030969598889350893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,balanced,0.03054400036732356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,power_law_1.01,0.04126079976558685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,power_law_1.01,0.028908801078796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,power_law_1.01,0.02903040051460266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,power_law_1.01,0.0531391978263855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,power_law_1.01,0.03175680041313171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,power_law_1.01,0.031481599807739256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,power_law_1.01,0.06407039761543273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,balanced,0.031530665854612984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,power_law_1.01,0.033036801218986514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,balanced,0.13701333602269491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,power_law_1.01,0.07455999851226806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,balanced,0.08180266618728638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,power_law_1.01,0.03283840119838714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,balanced,0.033802665770053864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,power_law_1.01,0.08444160223007202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,power_law_1.01,0.033215999603271484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,power_law_1.01,0.03326080143451691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,power_law_1.01,0.11320960521697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,balanced,0.032586666444937386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,power_law_1.01,0.13166719675064087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,power_law_1.01,0.19907840490341186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,power_law_1.01,0.03505280017852783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,power_law_1.01,0.21226880550384522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,power_law_1.01,0.03692159950733185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,power_law_1.01,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,power_law_1.01,0.26559998989105227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,balanced,0.16430399815241495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,power_law_1.01,0.040031999349594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,balanced,0.03825066735347112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,balanced,0.08955199519793193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,power_law_1.01,0.37303040027618406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,power_law_1.01,0.04175359904766083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,balanced,0.03862933317820231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,power_law_1.01,0.7105152130126953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,power_law_1.01,0.046963199973106384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,power_law_1.01,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,power_law_1.01,0.06346880197525025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,power_law_1.01,0.08677120208740234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,balanced,0.045328001181284584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,2048,768,8,128,4,64,power_law_1.2,0.02190079987049103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,power_law_1.01,0.1045632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,power_law_1.01,0.022707200050354003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,power_law_1.01,0.13292160034179687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,2048,768,8,128,4,64,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,balanced,0.05108266572157542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,power_law_1.01,0.022073599696159362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,power_law_1.01,0.15267839431762695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,2048,768,8,128,4,64,power_law_1.2,0.021356800198554994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,balanced,0.19584532578786215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,power_law_1.01,0.02240000069141388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,power_law_1.01,0.21444480419158934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,balanced,0.10333333412806193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,2048,768,8,128,4,64,power_law_1.2,0.022976000607013703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,power_law_1.01,0.024191999435424806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,power_law_1.01,0.27572479248046877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,2048,768,8,128,4,64,power_law_1.2,0.023443199694156647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,power_law_1.01,0.02462079972028732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,power_law_1.01,0.38930559158325195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,power_law_1.01,0.02595840096473694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,2048,768,8,128,4,64,power_law_1.2,0.0244159996509552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,power_law_1.01,0.026086398959159852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,power_law_1.01,0.5989247798919678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,2048,768,8,128,4,64,power_law_1.2,0.024345600605010988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,power_law_1.01,0.026291200518608095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,power_law_1.01,0.026688000559806822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,balanced,0.06557333469390869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,2048,768,8,128,4,64,power_law_1.2,0.025305598974227905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,power_law_1.01,1.1275648117065429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,power_law_1.01,0.02683520019054413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,2048,768,8,128,4,64,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,power_law_1.01,0.027219200134277345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,2048,768,8,128,4,64,power_law_1.2,0.030707201361656188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,power_law_1.01,0.02810879945755005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,2048,768,8,128,4,64,power_law_1.2,0.03089280128479004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,power_law_1.01,0.02842240035533905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,2048,768,8,128,4,64,power_law_1.2,0.031411200761795044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,balanced,0.07925333579381307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,2048,768,8,128,4,64,power_law_1.2,0.03208320140838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,power_law_1.01,0.029676800966262816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,power_law_1.01,0.033471998572349546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,2048,768,8,128,4,64,power_law_1.2,0.03442560136318207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,power_law_1.01,0.03392640054225922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,2048,768,8,128,4,64,power_law_1.2,0.03676159977912903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,2048,768,8,128,4,64,power_law_1.2,0.03713920116424561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,balanced,0.2881973385810852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,2048,768,8,128,4,64,power_law_1.2,0.039628800749778745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,balanced,0.1430186629295349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,power_law_1.01,0.0379967987537384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,2048,768,8,128,4,64,power_law_1.2,0.042956799268722534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,2048,768,8,128,4,64,power_law_1.2,0.04633600115776062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,power_law_1.01,0.04258559942245484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,2048,768,8,128,4,64,power_law_1.2,0.05467519760131836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,power_law_1.01,0.04929920136928558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,balanced,0.10479999581972758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,2048,768,8,128,4,64,power_law_1.2,0.06990079879760742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,2048,768,8,128,4,64,power_law_1.2,0.08967040181159973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,power_law_1.01,0.05694720149040222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,2048,768,8,128,4,64,power_law_1.2,0.10182399749755859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,power_law_1.01,0.06437119841575623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,2048,768,8,128,4,64,power_law_1.2,0.15484800338745117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,2048,768,8,128,4,64,power_law_1.2,0.21751680374145507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,power_law_1.01,0.08945279717445373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,2048,768,8,128,4,64,power_law_1.2,0.3034111976623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,power_law_1.01,0.11226880550384521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,2048,768,8,128,4,64,power_law_1.2,0.3233599901199341
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,2048,768,8,128,4,64,power_law_1.2,0.3659136056900024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,power_law_1.01,0.14595839977264405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,balanced,0.1297546625137329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,2048,768,8,128,4,64,power_law_1.2,0.6620800018310546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,power_law_1.01,0.17989120483398438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,power_law_1.2,1.6779071807861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,power_law_1.01,0.2876287937164307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,power_law_1.01,0.4190847873687744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,power_law_1.01,0.44464640617370604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,power_law_1.01,0.6905344009399415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,balanced,0.1549066702524821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,power_law_1.01,1.7017152786254883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,balanced,0.5360693136850992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,2048,768,8,128,4,64,balanced,0.2520693341890971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,balanced,0.22946133216222128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,2048,768,8,128,4,64,power_law_1.2,0.03130879998207092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,2048,768,8,128,4,64,power_law_1.2,0.028908801078796387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,2048,768,8,128,4,64,power_law_1.2,0.029497599601745604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,2048,768,8,128,4,64,power_law_1.2,0.03175680041313171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,2048,768,8,128,4,64,power_law_1.2,0.031795200705528257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,2048,768,8,128,4,64,power_law_1.2,0.03333120048046112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,2048,768,8,128,4,64,power_law_1.2,0.03292160034179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,2048,768,8,128,4,64,power_law_1.2,0.033107200264930726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,2048,768,8,128,4,64,power_law_1.2,0.03333120048046112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,2048,768,8,128,4,64,power_law_1.2,0.033228799700737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,2048,768,8,128,4,64,power_law_1.2,0.03466239869594574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,2048,768,8,128,4,64,power_law_1.2,0.03596160113811493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,2048,768,8,128,4,64,power_law_1.2,0.03596160113811493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,2048,768,8,128,4,64,power_law_1.2,0.0377023994922638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,2048,768,8,128,4,64,power_law_1.2,0.039603200554847715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,2048,768,8,128,4,64,power_law_1.2,0.042310398817062375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,2048,768,8,128,4,64,power_law_1.2,0.022860799729824067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,2048,768,8,128,4,64,power_law_1.2,0.04379520118236542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,2048,768,8,128,4,64,power_law_1.2,0.05023999810218811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,2048,768,8,128,4,64,power_law_1.2,0.022592000663280487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,2048,768,8,128,4,64,power_law_1.2,0.022944000363349915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,2048,768,8,128,4,64,power_law_1.2,0.05123839974403381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,balanced,0.46319464842478436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,2048,768,8,128,4,64,power_law_1.2,0.025043201446533204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,2048,768,8,128,4,64,power_law_1.2,0.061375999450683595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,2048,768,8,128,4,64,power_law_1.2,0.025312000513076784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,2048,768,8,128,4,64,power_law_1.2,0.07166720032691956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,2048,768,8,128,4,64,power_law_1.2,0.026092800498008727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,2048,768,8,128,4,64,power_law_1.2,0.10069760084152221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,2048,768,8,128,4,64,power_law_1.2,0.026316800713539125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,2048,768,8,128,4,64,power_law_1.2,0.12418559789657593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,2048,768,8,128,4,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,2048,768,8,128,4,64,power_law_1.2,0.18812160491943358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,2048,768,8,128,4,64,power_law_1.2,0.026399999856948853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,2048,768,8,128,4,64,power_law_1.2,0.22211840152740478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,2048,768,8,128,4,64,power_law_1.2,0.02675839960575104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,balanced,0.05904000004132589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,2048,768,8,128,4,64,power_law_1.2,0.027526399493217467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,2048,768,8,128,4,64,power_law_1.2,0.3344640016555786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,balanced,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,2048,768,8,128,4,64,power_law_1.2,0.028428798913955687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,2048,768,8,128,4,64,power_law_1.2,0.45165438652038575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,balanced,0.05950400233268738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,2048,768,8,128,4,64,power_law_1.2,0.028889599442481994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,balanced,0.0633493314186732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,2048,768,8,128,4,64,power_law_1.2,0.51080322265625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,2048,768,8,128,4,64,power_law_1.2,0.030169600248336793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,balanced,0.05994666616121928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,2048,768,8,128,4,64,power_law_1.2,0.033548799157142636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,2048,768,8,128,4,64,power_law_1.2,0.9561216354370117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,balanced,0.06300800045331319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,2048,768,8,128,4,64,power_law_1.2,0.03441919982433319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,balanced,0.06599999964237213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,2048,768,8,128,4,64,power_law_1.2,1.9946304321289063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,balanced,0.06723199784755707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,balanced,0.06338133414586385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,2048,768,8,128,4,64,power_law_1.2,0.04026240110397339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,balanced,0.06497066716353099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,2048,768,8,128,4,64,power_law_1.2,0.0456063985824585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,balanced,0.06431999802589417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,2048,768,8,128,4,64,power_law_1.2,0.052153599262237546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,balanced,0.05885333319505056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,balanced,0.06404800216356914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,2048,768,8,128,4,64,power_law_1.2,0.06559360027313232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,balanced,0.05914666752020518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,2048,768,8,128,4,64,power_law_1.2,0.0828544020652771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,balanced,0.067221333583196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,2048,768,8,128,4,64,power_law_1.2,0.09818879961967468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,balanced,0.0690773328145345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,2048,768,8,128,4,64,power_law_1.2,0.13218560218811035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,balanced,0.06392533580462138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,balanced,0.06347733239332835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,2048,768,8,128,4,64,power_law_1.2,0.25039360523223875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,balanced,0.06385600070158641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,2048,768,8,128,4,64,power_law_1.2,0.37959680557250974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,balanced,0.0639466643333435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,balanced,0.04594666759173075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,balanced,0.04831466575463613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,balanced,0.06043733159701029
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,2048,768,8,128,4,64,power_law_1.2,0.46645121574401854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,balanced,0.04701333244641622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,balanced,0.049423997600873314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,2048,768,8,128,4,64,power_law_1.2,0.7099199771881104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,balanced,0.09102933605511983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,balanced,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,balanced,0.05021866659323374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,balanced,0.08819199601809184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,2048,768,8,128,4,64,power_law_1.2,0.8756416320800782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,balanced,0.049509331583976746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,balanced,0.05040533343950907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,2048,768,8,128,4,64,power_law_1.2,1.099385643005371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,balanced,0.04985600213209788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,balanced,0.11668266852696736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.01,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,balanced,0.0513866643110911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,2048,768,8,128,4,64,power_law_1.2,3.386310577392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.01,0.058143997192382814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.01,0.04425599873065948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,balanced,0.04897599915663401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.01,0.058899199962615965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.01,0.04339199960231781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,balanced,0.04796266555786133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.01,0.06128000020980835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,balanced,0.13501866658528647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.01,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,balanced,0.049498667319615684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.01,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.01,0.0447488009929657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,balanced,0.05199466645717621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.01,0.06178560256958008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,balanced,0.026816000541051228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.01,0.046323201060295104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.01,0.06431360244750976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,balanced,0.05515733361244202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.01,0.062041598558425906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.01,0.04853120148181915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,balanced,0.026885333160559338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,balanced,0.05284800132115682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.01,0.06077439785003662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.01,0.048582398891448976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,balanced,0.026863999664783478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,balanced,0.054474666714668274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.01,0.060864001512527466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,balanced,0.19028266270955405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,balanced,0.028725333511829376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.01,0.04796159863471985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,balanced,0.028250666956106823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,balanced,0.05686933298905691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.01,0.060127997398376466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.01,0.04849919974803925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.01,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,balanced,0.029968000948429108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,balanced,0.05961599946022034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.01,0.047366398572921756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,balanced,0.030026666820049286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.01,0.05371519923210144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,balanced,0.029968000948429108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.01,0.04696959853172302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,balanced,0.06964266796906789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,balanced,0.03067733347415924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.01,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,balanced,0.03102933367093404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.01,0.04673280119895935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,balanced,0.07683733105659485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,balanced,0.031194667021433514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.01,0.04986880123615265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.01,0.059001600742340087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,balanced,0.03203733265399933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,balanced,0.23509865999221802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,balanced,0.0324799989660581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.01,0.05858560204505921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,balanced,0.1051626702149709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,balanced,0.03507733345031738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.01,0.07756800055503846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.01,0.0704576015472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,balanced,0.034629332522551216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.01,0.08612480163574218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.01,0.08520960211753845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.01,0.11316479444503784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,balanced,0.11641599734624226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.01,0.10537600517272949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.01,0.13223040103912354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.01,0.13456640243530274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.01,0.18851200342178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,balanced,0.03533333291610082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.01,0.16008319854736328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.01,0.2383807897567749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.01,0.3614975929260254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.01,0.23326079845428466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,balanced,0.15445866187413534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,balanced,0.03817066550254822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.01,0.44200959205627444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.01,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,balanced,0.29147199789683026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,balanced,0.037946666280428566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.01,0.7056447982788085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.01,0.4319744110107422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.01,0.9027199745178223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.01,0.6032127857208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.01,1.2561408042907716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,balanced,0.18762133518854776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.01,0.9185024261474609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.01,2.2243583679199217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.01,1.383244800567627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,balanced,0.045184001326560974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.01,4.004415893554688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.01,1.4793919563293456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,balanced,0.046997333566347756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.01,2.8146688461303713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,balanced,0.2634933392206828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.01,7.155417633056641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,balanced,0.061946665247281395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,power_law_1.01,0.02630400061607361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,power_law_1.01,0.02624639868736267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,balanced,0.4352746804555257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,balanced,0.07010666529337566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,power_law_1.01,0.0263808012008667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,power_law_1.01,0.028403198719024657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,balanced,0.3333386580149333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,power_law_1.01,0.028601598739624024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,power_law_1.01,0.029625600576400755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,power_law_1.01,0.029791998863220214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,power_law_1.01,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,power_law_1.01,0.030265599489212036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,power_law_1.01,0.030739200115203858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,power_law_1.01,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,balanced,0.08649067083994548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,power_law_1.01,0.03203200101852417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,2,128,power_law_1.2,0.062028801441192626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,power_law_1.01,0.0341376006603241
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,2,128,power_law_1.2,0.06110720038414001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,balanced,0.4100266695022583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,power_law_1.01,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,2,128,power_law_1.2,0.06106240153312683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,power_law_1.01,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,2,128,power_law_1.2,0.06382079720497132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,2,128,power_law_1.2,0.06208639740943909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,power_law_1.01,0.041171199083328246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,2,128,power_law_1.2,0.06407679915428162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,balanced,0.10337600111961365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,2,128,power_law_1.2,0.06513919830322265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,power_law_1.01,0.05329279899597168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,2,128,power_law_1.2,0.056550401449203494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,2,128,power_law_1.2,0.060889601707458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,power_law_1.01,0.07200000286102295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,2,128,power_law_1.2,0.05987200140953064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,power_law_1.01,0.07899519801139832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,2,128,power_law_1.2,0.054713600873947145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,2,128,power_law_1.2,0.051551997661590576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,2,128,power_law_1.2,0.05355520248413086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,power_law_1.01,0.09761279821395874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,balanced,0.1389226714769999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,2,128,power_law_1.2,0.06531199812889099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,power_law_1.01,0.12668800354003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,balanced,0.6273119846979777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,2,128,power_law_1.2,0.07649919986724854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,balanced,0.8362773259480795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,2,128,power_law_1.2,0.07493119835853576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,power_law_1.01,0.15020159482955933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,2,128,power_law_1.2,0.08131840229034423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,power_law_1.01,0.21942400932312012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,2,128,power_law_1.2,0.10101759433746338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,2,128,power_law_1.2,0.1316799998283386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,2,128,power_law_1.2,0.1929535984992981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,power_law_1.01,0.29672319889068605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,2,128,power_law_1.2,0.21784958839416504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,balanced,0.171999990940094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,2,128,power_law_1.2,0.32177278995513914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,power_law_1.01,0.3823103904724121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,2,128,power_law_1.2,0.4580927848815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,2,128,power_law_1.2,0.6391104221343994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,power_law_1.01,0.5200448036193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,2,128,power_law_1.2,0.9067839622497559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,2,128,power_law_1.2,0.04671359956264496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,power_law_1.01,0.7674367904663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,2,128,power_law_1.2,1.5786879539489747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,2,128,power_law_1.2,0.04795520007610321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,2,128,power_law_1.2,2.173017692565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,2,128,power_law_1.2,0.048204800486564635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,2,128,power_law_1.2,0.049439999461174014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,2,128,power_law_1.2,2.78851203918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,2,128,power_law_1.2,0.04807040095329285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,2,128,power_law_1.2,0.050937598943710326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,2,128,power_law_1.2,4.723968124389648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,2,128,power_law_1.2,0.04689280092716217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,power_law_1.01,0.844057559967041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,balanced,0.20905067523320517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,2,128,power_law_1.2,0.04865280091762543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,2,128,power_law_1.2,9.877804565429688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,2,128,power_law_1.2,0.048518401384353635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,power_law_1.01,1.429740810394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,2,128,power_law_1.2,0.04647679924964905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,2,128,power_law_1.2,0.046726399660110475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,power_law_1.01,2.9945920944213866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,2,128,power_law_1.2,0.04604800045490265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,balanced,1.2165919939676921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,2,128,power_law_1.2,0.044915199279785156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,2,128,power_law_1.2,0.05435519814491272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,2,128,power_law_1.2,0.058246397972106935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,2,128,power_law_1.2,0.05896959900856018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,2,128,power_law_1.2,0.06762880086898804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,2,128,power_law_1.2,0.08620799779891967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,balanced,0.3152746756871541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,2,128,power_law_1.2,0.10065280199050904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,2,128,power_law_1.2,0.13813120126724243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,2,128,power_law_1.2,0.18027520179748535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,2,128,power_law_1.2,0.24569599628448485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,2,128,power_law_1.2,0.34610559940338137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,2,128,power_law_1.2,0.515231990814209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,2,128,power_law_1.2,0.6579520225524902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,2,128,power_law_1.2,1.0017663955688476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,2,128,power_law_1.2,1.4649408340454102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,2,128,power_law_1.2,1.8077247619628907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,balanced,0.03389333436886469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,2,128,power_law_1.2,3.011008071899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,balanced,0.03324266771475474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,balanced,0.03509333233038584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,2,128,power_law_1.2,0.02619520127773285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,2,128,power_law_1.2,6.487974548339844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,balanced,0.036277333895365395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,balanced,0.032672000428040825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,2,128,power_law_1.2,0.026348799467086792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,balanced,0.0330079992612203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,balanced,0.033333333830038704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,2,128,power_law_1.2,0.026470398902893065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,balanced,0.03326933334271113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,balanced,0.03334933271010717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,2,128,power_law_1.2,0.028409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,balanced,0.034074666599432625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,2,128,power_law_1.2,0.02876800000667572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,balanced,0.03430933256944021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,2,128,power_law_1.2,0.02963840067386627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,balanced,0.03623466690381368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,balanced,0.043738668163617454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,2,128,power_law_1.2,0.03175039887428284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,balanced,0.042378668983777366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,2,128,power_law_1.2,0.030342400074005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,balanced,0.042405332128206887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,balanced,0.044682666659355164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,2,128,power_law_1.2,0.03033599853515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,balanced,0.047184000412623085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,2,128,power_law_1.2,0.030943998694419862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,balanced,0.047413334250450134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,balanced,0.6244639952977499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,2,128,power_law_1.2,0.03187839984893799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,balanced,0.05219733218352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,2,128,power_law_1.2,0.03487359881401062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,2,128,power_law_1.2,0.03528960049152374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,balanced,0.056261335810025535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,2,128,power_law_1.2,0.038848000764846805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,2,128,power_law_1.2,0.04286719858646393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,balanced,0.07036266724268596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,2,128,power_law_1.2,0.052172797918319705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,balanced,0.06795733173688252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,2,128,power_law_1.2,0.05964159965515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,2,128,power_law_1.2,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,2,128,power_law_1.2,0.10117759704589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,balanced,0.08839466174443562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,balanced,0.03356799980004629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,balanced,0.03204799940188726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,2,128,power_law_1.2,0.1328511953353882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,2,128,power_law_1.2,0.18876160383224488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,balanced,0.03478399912516276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,balanced,0.09171199798583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,balanced,0.038805333276589714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,balanced,0.0366239994764328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,2,128,power_law_1.2,0.2600640058517456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,balanced,0.03691199918588003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,balanced,0.036687999963760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,2,128,power_law_1.2,0.3515968084335327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,balanced,0.03711466739575068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,balanced,0.03796799977620443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,balanced,0.03847466657559077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,balanced,0.12574399511019388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,2,128,power_law_1.2,0.4752255916595459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,balanced,0.03862400104602178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,balanced,0.039146666725476585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,balanced,0.040037333965301514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,2,128,power_law_1.2,0.5985343933105469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,balanced,0.042490666111310325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,balanced,0.04212800165017446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,2,128,power_law_1.2,0.8699968338012696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,balanced,0.04398933549722036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,balanced,0.04682666560014089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,2,128,power_law_1.2,1.050163173675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,balanced,0.1439893345038096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,balanced,0.05049066742261251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,balanced,0.06418666740258534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,2,128,power_law_1.2,1.353433609008789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,balanced,0.07126399874687195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,2,128,power_law_1.2,2.125484848022461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,balanced,0.09152000149091084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,2,128,power_law_1.2,4.180511856079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,balanced,0.10246933499972026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,balanced,0.16965866088867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,balanced,0.13386666774749756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.01,0.03999359905719757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,balanced,0.026687999566396076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,balanced,0.15818132956822714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.01,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.01,0.03260799944400787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.01,0.033478400111198424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,balanced,0.02658133457104365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.01,0.03301759958267212
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.01,0.03312639892101288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,balanced,0.028373333315054577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.01,0.035648000240325925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,balanced,0.0286613330245018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.01,0.03527680039405823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,balanced,0.03012266755104065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.01,0.03540480136871338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,balanced,0.03062933435042699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,balanced,0.22031466166178384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.01,0.03612799942493439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.01,0.03282560110092163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,balanced,0.03046933313210805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.01,0.036396801471710205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,balanced,0.03033066789309184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.01,0.03284479975700379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.01,0.03678719997406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.01,0.03703039884567261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,balanced,0.24962133169174194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,balanced,0.0316746657093366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.01,0.03663359880447388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.01,0.03837440013885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,balanced,0.03187733391920725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.01,0.03699199855327606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.01,0.042412799596786496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,balanced,0.032799998919169106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.01,0.03852800130844116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.01,0.04625279903411865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,balanced,0.032986665765444435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.01,0.03948799967765808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,balanced,0.2733706633249919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.01,0.05144320130348205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,balanced,0.03639466563860575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.01,0.04081920087337494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.01,0.060192000865936277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,balanced,0.035258665680885315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.01,0.04190720021724701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.01,0.04482559859752655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.01,0.04469119906425476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.01,0.046515199542045596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.01,0.04815999865531921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.01,0.04981119930744171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.01,0.05441280007362366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.01,0.053286397457122804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,balanced,0.03665599972009659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.01,0.06276479959487916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.01,0.06783360242843628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,balanced,0.039674667020638786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.01,0.06870399713516236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.01,0.07217919826507568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,balanced,0.3309066692988078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.01,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.01,0.08732799887657165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,balanced,0.03997866561015447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.01,0.10168960094451904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.01,0.10787839889526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.01,0.1357375979423523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.01,0.13181439638137818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,power_law_1.01,0.0271232008934021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.01,0.14387840032577515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.01,0.13441280126571656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.01,0.20643200874328613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,power_law_1.01,0.026655998826026917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.01,0.24483199119567872
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,balanced,0.04840533435344696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.01,0.25905280113220214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,power_law_1.01,0.026726400852203368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.01,0.2248960018157959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.01,0.36593921184539796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,balanced,0.05330666899681091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,power_law_1.01,0.02865920066833496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.01,0.3591423988342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.01,0.4870336055755615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,4,64,power_law_1.2,0.03387520015239716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,power_law_1.01,0.029203200340270997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.01,0.42162561416625977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,4,64,power_law_1.2,0.03293440043926239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,power_law_1.01,0.030124801397323608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.01,0.6000319957733155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,4,64,power_law_1.2,0.03293440043926239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.01,0.4206528186798096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,power_law_1.01,0.03049600124359131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,4,64,power_law_1.2,0.03459199965000152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,balanced,0.06780266761779785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.01,0.9866559982299805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,4,64,power_law_1.2,0.034969601035118106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.01,0.7114048004150391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,power_law_1.01,0.030534398555755616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,4,64,power_law_1.2,0.03251200020313263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,balanced,0.5019253492355347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,4,64,power_law_1.2,0.03283199965953827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.01,2.1580223083496093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,power_law_1.01,0.03084160089492798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.01,1.8374143600463868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,4,64,power_law_1.2,0.04213759899139404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,balanced,0.07772799829641978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,balanced,0.46053866545359295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,power_law_1.01,0.03121280074119568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,4,64,power_law_1.2,0.041868799924850465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,power_law_1.01,0.03343360126018524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,4,64,power_law_1.2,0.044038400053977966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,power_law_1.01,0.03477759957313538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,4,64,power_law_1.2,0.051635199785232545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,power_law_1.01,0.035872000455856326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,4,64,power_law_1.2,0.058937597274780276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,4,64,power_law_1.2,0.07098879814147949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,power_law_1.01,0.03653759956359863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,4,64,power_law_1.2,0.04497919976711273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,power_law_1.01,0.04097279906272888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,4,64,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,power_law_1.01,0.043315199017524716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,4,64,power_law_1.2,0.04993920028209686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,balanced,0.09868266185124715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,4,64,power_law_1.2,0.061561602354049685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,4,64,power_law_1.2,0.0707584023475647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,power_law_1.01,0.05542399883270264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,4,64,power_law_1.2,0.08067839741706848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,power_law_1.01,0.061286401748657224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,4,64,power_law_1.2,0.11264640092849731
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,power_law_1.01,0.07096319794654846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,4,64,power_law_1.2,0.12031999826431275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,4,64,power_law_1.2,0.1942911982536316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,balanced,0.1197119951248169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,4,64,power_law_1.2,0.18774399757385254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,4,64,power_law_1.2,0.31658880710601806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,power_law_1.01,0.08929280042648316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,4,64,power_law_1.2,0.4247615814208984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,power_law_1.01,0.11324160099029541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,4,64,power_law_1.2,0.5428224086761475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,4,64,power_law_1.2,0.6426432132720947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,power_law_1.01,0.1552832007408142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,4,64,power_law_1.2,0.9461695671081543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,power_law_1.01,0.19227520227432252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,4,64,power_law_1.2,1.6181631088256836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,4,64,power_law_1.2,3.197465515136719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,balanced,0.16671466827392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,power_law_1.01,0.26796159744262693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,power_law_1.01,0.3712768077850342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,balanced,0.9632746378580729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,power_law_1.01,0.5836671829223633
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,power_law_1.01,0.7624896049499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,balanced,0.20811732610066733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,power_law_1.01,0.884614372253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,4,64,power_law_1.2,0.040006399154663086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,power_law_1.01,1.2730560302734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,4,64,power_law_1.2,0.03319680094718933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,power_law_1.01,2.824473571777344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,4,64,power_law_1.2,0.03429119884967804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,4,64,power_law_1.2,0.03570559918880463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,4,64,power_law_1.2,0.03746559917926788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,4,64,power_law_1.2,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,4,64,power_law_1.2,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,balanced,0.25685866673787433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,4,64,power_law_1.2,0.03675520122051239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,4,64,power_law_1.2,0.03681280016899109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,4,64,power_law_1.2,0.037171199917793274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,4,64,power_law_1.2,0.03863680064678192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,4,64,power_law_1.2,0.040403199195861814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,4,64,power_law_1.2,0.041254401206970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,4,64,power_law_1.2,0.042828801274299624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,4,64,power_law_1.2,0.04620159864425659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,4,64,power_law_1.2,0.05161600112915039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,4,64,power_law_1.2,0.05235199928283692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,4,64,power_law_1.2,0.06685439944267273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,4,64,power_law_1.2,0.07399680018424988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,balanced,0.4134773413340251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,4,64,power_law_1.2,0.0893119990825653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,4,64,power_law_1.2,0.12087039947509766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,4,64,power_law_1.2,0.17679359912872314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,4,64,power_law_1.2,0.17590399980545043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,4,64,power_law_1.2,0.2804287910461426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,4,64,power_law_1.2,0.36947200298309324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,4,64,power_law_1.2,0.5123775959014892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,4,64,power_law_1.2,0.8189184188842773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,4,64,power_law_1.2,1.0560832023620605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,4,64,power_law_1.2,1.517529582977295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,4,64,power_law_1.2,2.8619712829589843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,balanced,0.033733333150545754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,balanced,0.03305600086847941
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,balanced,0.7875520388285319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,balanced,0.02938133229811986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,balanced,0.029343999922275543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,balanced,0.031898667414983116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,balanced,0.030975999931494396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,balanced,0.03194666653871536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,balanced,0.0325546662012736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,4,64,power_law_1.2,0.02707200050354004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,balanced,0.034789333740870156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,balanced,0.036544000109036766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,balanced,0.03654933224121729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,4,64,power_law_1.2,0.026495999097824095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,balanced,0.03719999889532725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,balanced,0.03909866760174433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,balanced,0.03721600025892258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,4,64,power_law_1.2,0.026918399333953857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,balanced,0.03708266715208689
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,balanced,0.03718933214743932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,4,64,power_law_1.2,0.028966400027275085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,balanced,0.03825066735347112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,balanced,0.039279999832312264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,balanced,0.03910933434963226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,4,64,power_law_1.2,0.029600000381469725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,balanced,0.03998400022586187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,balanced,0.03698666642109553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,balanced,0.04404266675313314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,4,64,power_law_1.2,0.030054399371147157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,balanced,0.0379573330283165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,balanced,0.044341335693995156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,4,64,power_law_1.2,0.030508801341056824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,balanced,0.0382080003619194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,balanced,0.045498669147491455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,4,64,power_law_1.2,0.03108479976654053
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,balanced,0.04524266719818115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,balanced,0.038176000118255615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,4,64,power_law_1.2,0.03152639865875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,balanced,0.048453330993652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,balanced,0.03897066662708918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,4,64,power_law_1.2,0.032287999987602234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,balanced,0.0397173340121905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,balanced,0.04953599969546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,4,64,power_law_1.2,0.033523198962211606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,balanced,0.04308799902598063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,balanced,0.05367999772230784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,4,64,power_law_1.2,0.03521920144557953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,balanced,0.04257066547870636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,4,64,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,balanced,0.05916800101598104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,balanced,0.045381332437197365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,4,64,power_law_1.2,0.03962239921092987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,balanced,0.07542933523654938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,4,64,power_law_1.2,0.04195840060710907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,balanced,0.04953599969546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,4,64,power_law_1.2,0.0456959992647171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,balanced,0.050944000482559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,balanced,0.07539199789365132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,balanced,0.066170667608579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,4,64,power_law_1.2,0.05675519704818725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,4,64,power_law_1.2,0.07472000122070313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,balanced,0.07484800120194753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.01,0.029702401161193846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,balanced,0.09975999593734741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,4,64,power_law_1.2,0.08823680281639099
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.01,0.02913280129432678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,balanced,0.09500799576441447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.01,0.030636799335479737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.01,0.035776001214981076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.01,0.0321152001619339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,4,64,power_law_1.2,0.10512000322341919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.01,0.032915198802948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,balanced,0.10595200459162395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.01,0.03607679903507233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,balanced,0.10717866818110149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,balanced,0.026746665438016255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,4,64,power_law_1.2,0.1384703993797302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.01,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.01,0.03451519906520843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,balanced,0.026394667724768322
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.01,0.034944000840187076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,4,64,power_law_1.2,0.22846720218658448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.01,0.04178560078144074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,balanced,0.02651199946800868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.01,0.03627519905567169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,balanced,0.14480533202489218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.01,0.044352000951766966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,4,64,power_law_1.2,0.3620800018310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.01,0.03637759983539581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,balanced,0.028938665986061096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.01,0.046911999583244324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.01,0.03651840090751648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,balanced,0.029114666084448498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,balanced,0.15250666936238608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.01,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.01,0.05199360251426697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,balanced,0.030576000610987347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,4,64,power_law_1.2,0.5168255805969239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.01,0.038464000821113585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,balanced,0.031136001149813335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.01,0.05617280006408691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.01,0.03976959884166718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,balanced,0.17264533042907715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,balanced,0.030778666337331135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.01,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.01,0.04154239892959595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,4,64,power_law_1.2,0.589958381652832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,balanced,0.0306986669699351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.01,0.041145598888397215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.01,0.045126399397850035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.01,0.04359680116176605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,balanced,0.03143466760714849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.01,0.04834559857845307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.01,0.04721280038356781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,4,64,power_law_1.2,0.9080384254455567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,balanced,0.03183466692765554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.01,0.05015040040016174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.01,0.04925439953804016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,balanced,0.03295466552178065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.01,0.053299200534820554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,balanced,0.17965867122014365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.01,0.05203840136528015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.01,0.061267197132110596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,4,64,power_law_1.2,1.2072768211364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,balanced,0.03335466732581457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,balanced,0.24381333589553833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.01,0.060787200927734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.01,0.06668800115585327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,balanced,0.03398400048414866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,4,64,power_law_1.2,1.8008832931518555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.01,0.08913919925689698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.01,0.06639999747276307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.01,0.0981440007686615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,4,64,power_law_1.2,3.0083776473999024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.01,0.08250240087509156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.01,0.12686079740524292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,balanced,0.03743999948104223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.01,0.15774719715118407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.01,0.09166719913482665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,4,64,power_law_1.2,5.562047958374023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,balanced,0.037061333656311035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.01,0.2207808017730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.01,0.11790720224380494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.01,0.2793855905532837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.01,0.1313599944114685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.01,0.42344322204589846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,balanced,0.3066026568412781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.01,0.1723647952079773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.01,0.4876992225646973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,balanced,0.2121280034383138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.01,0.2345344066619873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.01,0.6109504222869873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,balanced,0.03850133220354716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.01,0.970400047302246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.01,0.36332800388336184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,balanced,0.04320533573627472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.01,0.43843841552734375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.01,2.196352005004883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,balanced,0.04433600107828776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.01,0.4889664173126221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.01,0.774726390838623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,balanced,0.05422399938106537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.01,1.6213632583618165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,balanced,0.3705759843190511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,balanced,0.06192533175150553
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,balanced,0.08134399851163228
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,balanced,0.31271467606226605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,balanced,0.09460266431172688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,power_law_1.01,0.02876800000667572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,power_law_1.01,0.026796799898147584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,power_law_1.01,0.026604801416397095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,power_law_1.01,0.029241600632667543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,power_law_1.01,0.029811200499534608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,balanced,0.1246560017267863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,balanced,0.5663839975992838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,power_law_1.01,0.03088639974594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,power_law_1.01,0.031404799222946166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,power_law_1.01,0.03224959969520569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,power_law_1.01,0.03276160061359405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,power_law_1.01,0.03491199910640717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,balanced,0.15801067153612772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,power_law_1.01,0.03711360096931458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,power_law_1.01,0.04007039964199066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,8,32,power_law_1.2,0.03663359880447388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,power_law_1.01,0.04352000057697296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,8,32,power_law_1.2,0.028799998760223388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,power_law_1.01,0.0455487996339798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,8,32,power_law_1.2,0.029504001140594482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,8,32,power_law_1.2,0.031481599807739256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,8,32,power_law_1.2,0.031839999556541446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,8,32,power_law_1.2,0.03589119911193848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,balanced,0.23430399099985758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,power_law_1.01,0.05399680137634277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,8,32,power_law_1.2,0.035897600650787356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,8,32,power_law_1.2,0.04614399969577789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,power_law_1.01,0.06764159798622131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,8,32,power_law_1.2,0.04656000137329101
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,power_law_1.01,0.0759168028831482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,8,32,power_law_1.2,0.04850560128688812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,balanced,0.581216017405192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,8,32,power_law_1.2,0.055232000350952146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,power_law_1.01,0.0858240008354187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,8,32,power_law_1.2,0.05783039927482605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,power_law_1.01,0.11175040006637574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,8,32,power_law_1.2,0.07493119835853576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,8,32,power_law_1.2,0.04604159891605377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,power_law_1.01,0.1658687949180603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,8,32,power_law_1.2,0.05028480291366577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,power_law_1.01,0.24119040966033936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,8,32,power_law_1.2,0.05123199820518494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,8,32,power_law_1.2,0.0525056004524231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,balanced,0.3053013285001119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,8,32,power_law_1.2,0.06736000180244446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,power_law_1.01,0.3647615909576416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,8,32,power_law_1.2,0.07345280051231384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,balanced,1.0964372952779133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,power_law_1.01,0.40259838104248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,8,32,power_law_1.2,0.09082239866256714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,8,32,power_law_1.2,0.11317119598388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,8,32,power_law_1.2,0.13661439418792726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,power_law_1.01,0.5422783851623535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,8,32,power_law_1.2,0.18341759443283082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,8,32,power_law_1.2,0.26841599941253663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,8,32,power_law_1.2,0.35290238857269285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,power_law_1.01,0.8809663772583007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,8,32,power_law_1.2,0.6153408050537109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,power_law_1.01,1.0195327758789063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,balanced,0.3736960093180339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,8,32,power_law_1.2,0.6123136043548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,power_law_1.01,1.5295488357543945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,8,32,power_law_1.2,0.7591423988342285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,8,32,power_law_1.2,1.3107328414916992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,power_law_1.01,2.7878976821899415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,8,32,power_law_1.2,3.645471954345703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,balanced,0.5776106516520182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,8,32,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,8,32,power_law_1.2,0.032390400767326355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,8,32,power_law_1.2,0.03219839930534363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,8,32,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,8,32,power_law_1.2,0.03470720052719116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,8,32,power_law_1.2,0.03858560025691986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,balanced,0.039450667798519135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,8,32,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,balanced,0.03336533407370249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,8,32,power_law_1.2,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,balanced,0.03404266635576884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,8,32,power_law_1.2,0.03891839981079102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,balanced,0.036848001182079315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,8,32,power_law_1.2,0.037990400195121767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,4096,1536,8,128,8,32,power_law_1.2,0.02863360047340393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,balanced,0.036757332583268486
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,8,32,power_law_1.2,0.04195840060710907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,balanced,0.03809600075085958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,4096,1536,8,128,8,32,power_law_1.2,0.026572799682617186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,8,32,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,balanced,0.040063999593257904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,4096,1536,8,128,8,32,power_law_1.2,0.026815998554229736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,8,32,power_law_1.2,0.04333440065383911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,balanced,0.03869866579771042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,4096,1536,8,128,8,32,power_law_1.2,0.029100799560546876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,8,32,power_law_1.2,0.04291839897632599
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,balanced,0.038032000263532005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,4096,1536,8,128,8,32,power_law_1.2,0.02974080145359039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,8,32,power_law_1.2,0.04630399942398071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,4096,1536,8,128,8,32,power_law_1.2,0.031014400720596313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,balanced,0.04055999964475632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,8,32,power_law_1.2,0.04936319887638092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,4096,1536,8,128,8,32,power_law_1.2,0.031225600838661195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,8,32,power_law_1.2,0.05348479747772217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,balanced,0.04099733382463455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,4096,1536,8,128,8,32,power_law_1.2,0.032416000962257385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,8,32,power_law_1.2,0.06236159801483154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,balanced,0.03978666663169861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,4096,1536,8,128,8,32,power_law_1.2,0.03336319923400879
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,8,32,power_law_1.2,0.07418879866600037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,balanced,1.113381306330363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,balanced,0.039834665755430855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,4096,1536,8,128,8,32,power_law_1.2,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,8,32,power_law_1.2,0.09048320055007934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,balanced,0.04388799766699473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,4096,1536,8,128,8,32,power_law_1.2,0.034643200039863584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,8,32,power_law_1.2,0.12005120515823364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,4096,1536,8,128,8,32,power_law_1.2,0.03803519904613495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,balanced,0.04387733340263367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,8,32,power_law_1.2,0.16095999479293824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,4096,1536,8,128,8,32,power_law_1.2,0.03837440013885498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,balanced,0.04956266780694326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,8,32,power_law_1.2,0.19092479944229127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,4096,1536,8,128,8,32,power_law_1.2,0.04136320054531097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,balanced,0.05133866767088572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,8,32,power_law_1.2,0.2782144069671631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,balanced,0.055573334296544395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,8,32,power_law_1.2,0.3553087949752808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,4096,1536,8,128,8,32,power_law_1.2,0.044627198576927186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,8,32,power_law_1.2,0.6376512050628662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,balanced,0.055061335364977516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,4096,1536,8,128,8,32,power_law_1.2,0.04595839977264404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,8,32,power_law_1.2,0.7031424045562744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,balanced,0.06069866816202799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,8,32,power_law_1.2,0.9820992469787597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,4096,1536,8,128,8,32,power_law_1.2,0.05813760161399841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,balanced,0.07020799815654755
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,8,32,power_law_1.2,1.7939712524414062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,4096,1536,8,128,8,32,power_law_1.2,0.0680512011051178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,4096,1536,8,128,8,32,power_law_1.2,0.08920320272445678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,balanced,0.032405334214369454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,8,32,power_law_1.2,2.9499263763427734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,balanced,0.0801333338022232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,balanced,0.03188266605138779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,balanced,0.03275733441114426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,4096,1536,8,128,8,32,power_law_1.2,0.12908159494400023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,balanced,0.03521066655715307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,balanced,0.08991466959317525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,balanced,0.03653866549332937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,4096,1536,8,128,8,32,power_law_1.2,0.13345919847488402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,balanced,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,balanced,0.03940266619126002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,balanced,0.039306665460268654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,4096,1536,8,128,8,32,power_law_1.2,0.2619136095046997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,balanced,0.039477333426475525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,balanced,0.12377599875132243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,balanced,0.0402453343073527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,4096,1536,8,128,8,32,power_law_1.2,0.4349247932434082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,balanced,0.04026666780312856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,balanced,0.040421334405740104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,4096,1536,8,128,8,32,power_law_1.2,0.4401088237762451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,balanced,0.04257600009441376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,balanced,0.04260799785455068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,balanced,0.04462933540344238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,balanced,0.14618133505185446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,4096,1536,8,128,8,32,power_law_1.2,0.5343616008758545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,balanced,0.044735997915267944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,balanced,0.04771199822425842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,4096,1536,8,128,8,32,power_law_1.2,0.9021439552307129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,balanced,0.05261866748332977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,balanced,0.05729599793752035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,4096,1536,8,128,8,32,power_law_1.2,1.369331169128418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,balanced,0.07096533477306366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,balanced,0.21095999081929526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,4096,1536,8,128,8,32,power_law_1.2,2.12108154296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,balanced,0.08406399687131245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,4096,1536,8,128,8,32,power_law_1.2,3.258252716064453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,balanced,0.1037493348121643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,4096,1536,8,128,8,32,power_law_1.2,5.459302520751953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,balanced,0.12009599804878235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.01,0.03984639942646027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.01,0.047391998767852786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.01,0.03315199911594391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,balanced,0.27164800961812335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.01,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,balanced,0.16664533813794455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.01,0.03403519988059998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.01,0.034771201014518735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.01,0.03379839956760407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.01,0.03617919981479645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.01,0.03576320111751556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.01,0.03813759982585907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.01,0.03707520067691803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.01,0.038176000118255615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,balanced,0.2046453356742859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.01,0.038099199533462524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.01,0.03878400027751923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.01,0.03878400027751923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.01,0.038515201210975646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.01,0.039110401272773744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.01,0.04016000032424927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.01,0.03960959911346436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.01,0.04140160083770752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,balanced,0.3213493426640828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.01,0.04535039961338043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.01,0.04089600145816803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.01,0.04759680032730103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.01,0.04206080138683319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.01,0.048979198932647704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,balanced,0.29764266808827716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.01,0.04392960071563721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.01,0.051526397466659546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.01,0.04598399996757507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.01,0.05489280223846436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.01,0.048563200235366824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.01,0.05740159749984741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.01,0.05311999917030334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.01,0.06498559713363647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.01,0.055820798873901366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.01,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.01,0.06972159743309021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.01,0.06515200138092041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.01,0.08643199801445008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,balanced,0.38523733615875244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.01,0.07196159958839417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.01,0.09292799830436707
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.01,0.12643200159072876
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.01,0.09277439713478089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.01,0.15788160562515258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.01,0.10454399585723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.01,0.19661439657211305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.01,0.1390720009803772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.01,0.24625918865203858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,balanced,0.44993066787719727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.01,0.175545597076416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.01,0.4230720043182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.01,0.548851203918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.01,0.23322880268096924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.01,0.5844416141510009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.01,0.30680320262908933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.01,0.877894401550293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.01,0.47757439613342284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,balanced,0.4686986605326335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.01,1.774630355834961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.01,0.5676095962524415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.01,0.7779263973236084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.01,1.2823871612548827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.01,2.3924543380737306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,balanced,0.7015573183695475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,balanced,0.8735093275705973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,16,16,power_law_1.2,0.04625920057296753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,16,16,power_law_1.2,0.03412480056285858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,16,16,power_law_1.2,0.03505919873714447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,16,16,power_law_1.2,0.03612160086631775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,16,16,power_law_1.2,0.036800000071525577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,16,16,power_law_1.2,0.03860479891300202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,16,16,power_law_1.2,0.038150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,16,16,power_law_1.2,0.0400191992521286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,16,16,power_law_1.2,0.03961600065231323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,16,16,power_law_1.2,0.04270080029964447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,16,16,power_law_1.2,0.04575999975204468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,16,16,power_law_1.2,0.04744960069656372
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,16,16,power_law_1.2,0.04758400022983551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,16,16,power_law_1.2,0.05151360034942627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,16,16,power_law_1.2,0.05431680083274841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,balanced,1.3868160247802734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,16,16,power_law_1.2,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,16,16,power_law_1.2,0.06741759777069092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,16,16,power_law_1.2,0.07516800165176392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,16,16,power_law_1.2,0.07564160227775574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,16,16,power_law_1.2,0.10138880014419556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,16,16,power_law_1.2,0.10670720338821411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,16,16,power_law_1.2,0.17153919935226442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,16,16,power_law_1.2,0.03885439932346344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,16,16,power_law_1.2,0.1772096037864685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,16,16,power_law_1.2,0.2784575939178467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,16,16,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,16,16,power_law_1.2,0.347871994972229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,16,16,power_law_1.2,0.03224320113658905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,16,16,power_law_1.2,0.47759361267089845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,16,16,power_law_1.2,0.03404799997806549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,16,16,power_law_1.2,0.6397632122039795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,16,16,power_law_1.2,0.03573760092258453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,16,16,power_law_1.2,1.0149120330810546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,16,16,power_law_1.2,0.038150399923324585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,16,16,power_law_1.2,0.03830400109291077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,16,16,power_law_1.2,0.03914879858493805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,16,16,power_law_1.2,1.4691200256347656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,16,16,power_law_1.2,0.039392000436782836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,16,16,power_law_1.2,0.03985919952392578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,16,16,power_law_1.2,3.299020767211914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,16,16,power_law_1.2,0.04256640076637268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,16,16,power_law_1.2,0.04337919950485229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,16,16,power_law_1.2,0.04417920112609863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,16,16,power_law_1.2,0.04709759950637817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,16,16,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,16,16,power_law_1.2,0.05429760217666626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,16,16,power_law_1.2,0.056358402967453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,16,16,power_law_1.2,0.06487680077552796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,16,16,power_law_1.2,0.07397119998931885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,16,16,power_law_1.2,0.09800320267677307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,16,16,power_law_1.2,0.11781120300292969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,16,16,power_law_1.2,0.14670079946517944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,16,16,power_law_1.2,0.18614399433135986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,16,16,power_law_1.2,0.287558388710022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,16,16,power_law_1.2,0.36943359375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,16,16,power_law_1.2,0.5736127853393554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,16,16,power_law_1.2,0.7788479804992676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,16,16,power_law_1.2,1.0714240074157715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,16,16,power_law_1.2,1.56494083404541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,balanced,0.032730666299661
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,balanced,0.0351946676770846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,16,16,power_law_1.2,4.132006454467773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,balanced,0.032469332218170166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,balanced,0.03396799912055334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,balanced,0.03348266581694285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,balanced,0.03392533212900162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,balanced,0.036117332677046456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,balanced,0.04517866671085358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,balanced,0.04649066428343455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,balanced,0.05009066561857859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,balanced,0.04683733483155569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,balanced,0.04680533210436503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,balanced,0.040576001008351646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,balanced,0.04682666560014089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,balanced,0.04125866790612539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,balanced,0.04744000236193339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,balanced,0.04035733391841253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,balanced,0.047797332207361855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,balanced,0.04072533299525579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,balanced,0.04820266862710317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,balanced,0.04907733201980591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,balanced,0.04081599911053976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,balanced,0.050026665131251015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,balanced,0.049866666396458946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,balanced,0.05064000189304352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,balanced,0.04186666508515676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,balanced,0.05050133168697357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,balanced,0.05994133154551188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,balanced,0.04699199895064036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,balanced,0.06355200211207072
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,balanced,0.05080533524354299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,balanced,0.06624533236026764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,balanced,0.06669333577156067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,balanced,0.06258133550484975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,balanced,0.081535999973615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,balanced,0.06718933085600536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,balanced,0.09330133597056071
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,balanced,0.07765333354473114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,balanced,0.12692266702651978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,balanced,0.09233066439628601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,balanced,0.1239520013332367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,balanced,0.15042666594187418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,balanced,0.12270399928092957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,balanced,0.22078933318456015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,balanced,0.17163733641306558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,balanced,0.2810080051422119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,balanced,0.22374399503072104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.01,0.0394239991903305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.01,0.03678719997406006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,balanced,0.4103200038274129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.01,0.03949440121650696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,balanced,0.32229334115982056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.01,0.047366398572921756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.01,0.04170880019664765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.01,0.042361599206924436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.01,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.01,0.042099198698997496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.01,0.04275839924812317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.01,0.04933759868144989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.01,0.033542400598526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.01,0.0361407995223999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.01,0.049516800045967105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.01,0.039084801077842714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.01,0.05211520195007324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,balanced,0.5111306508382162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,balanced,0.4500799973805745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.01,0.0456959992647171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.01,0.05711359977722168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.01,0.061990398168563846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.01,0.046412798762321475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.01,0.06481279730796814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.01,0.04624640047550201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.01,0.07120640277862549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.01,0.04752640128135681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.01,0.08019199967384338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.01,0.04965119957923889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.01,0.08214399814605713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.01,0.05084159970283508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.01,0.09542400240898133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.01,0.05203199982643127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.01,0.11663360595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.01,0.05413119792938233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.01,0.1468287944793701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.01,0.05665919780731201
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.01,0.1641152024269104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,balanced,0.6366560061772665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.01,0.059552001953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.01,0.2549312114715576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,balanced,0.5727680126825968
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.01,0.06808320283889771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.01,0.33264639377593996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.01,0.07442560195922851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.01,0.4553664207458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.01,0.08136320114135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.01,0.6682112216949463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.01,0.10615040063858032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.01,0.8455103874206543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.01,0.12016639709472657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.01,0.1690816044807434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.01,1.2091456413269044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.01,0.21516799926757812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.01,2.7558656692504884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.01,0.3043839931488037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.01,0.3616767883300781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.01,0.5843776226043701
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.01,0.8172991752624512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.01,0.8934528350830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.01,1.587782382965088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,balanced,0.9999679724375407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.01,3.333235168457031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,balanced,0.863264004389445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,4096,1536,8,128,32,8,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,4096,1536,8,128,32,8,power_law_1.2,0.03408640027046204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,4096,1536,8,128,32,8,power_law_1.2,0.03500159978866577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,4096,1536,8,128,32,8,power_law_1.2,0.03702400028705597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,4096,1536,8,128,32,8,power_law_1.2,0.03761279881000519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,4096,1536,8,128,32,8,power_law_1.2,0.04892799854278564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,4096,1536,8,128,32,8,power_law_1.2,0.041657599806785586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,4096,1536,8,128,32,8,power_law_1.2,0.042508798837661746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,4096,1536,8,128,32,8,power_law_1.2,0.0420415997505188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,4096,1536,8,128,32,8,power_law_1.2,0.04469760060310364
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,4096,1536,8,128,32,8,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,4096,1536,8,128,32,8,power_law_1.2,0.051520001888275144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,4096,1536,8,128,32,8,power_law_1.2,0.051475197076797485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,4096,1536,8,128,32,8,power_law_1.2,0.05620480179786682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,4096,1536,8,128,32,8,power_law_1.2,0.06245120167732239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,4096,1536,8,128,32,8,power_law_1.2,0.03607040047645569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,4096,1536,8,128,32,8,power_law_1.2,0.06453120112419128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,4096,1536,8,128,32,8,power_law_1.2,0.03253119885921478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,4096,1536,8,128,32,8,power_law_1.2,0.07297279834747314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,balanced,1.9617813428243
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,4096,1536,8,128,32,8,power_law_1.2,0.0326335996389389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,balanced,1.6825599670410156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,4096,1536,8,128,32,8,power_law_1.2,0.0809664011001587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,4096,1536,8,128,32,8,power_law_1.2,0.03633280098438263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,4096,1536,8,128,32,8,power_law_1.2,0.08744320273399353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,4096,1536,8,128,32,8,power_law_1.2,0.10890239477157593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,4096,1536,8,128,32,8,power_law_1.2,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,4096,1536,8,128,32,8,power_law_1.2,0.040556800365447995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,4096,1536,8,128,32,8,power_law_1.2,0.1295232057571411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,4096,1536,8,128,32,8,power_law_1.2,0.04423039853572845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,4096,1536,8,128,32,8,power_law_1.2,0.15858559608459472
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,4096,1536,8,128,32,8,power_law_1.2,0.046438398957252505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,4096,1536,8,128,32,8,power_law_1.2,0.19833600521087646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,4096,1536,8,128,32,8,power_law_1.2,0.04705919921398163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,4096,1536,8,128,32,8,power_law_1.2,0.29300479888916015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,4096,1536,8,128,32,8,power_law_1.2,0.0484607994556427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,4096,1536,8,128,32,8,power_law_1.2,0.3553087949752808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,4096,1536,8,128,32,8,power_law_1.2,0.04863359928131104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,4096,1536,8,128,32,8,power_law_1.2,0.7033535957336425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,4096,1536,8,128,32,8,power_law_1.2,0.050944000482559204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,4096,1536,8,128,32,8,power_law_1.2,0.9257599830627441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,4096,1536,8,128,32,8,power_law_1.2,0.05279359817504883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,4096,1536,8,128,32,8,power_law_1.2,0.053395199775695804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,4096,1536,8,128,32,8,power_law_1.2,1.0306559562683106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,4096,1536,8,128,32,8,power_law_1.2,0.0580735981464386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,4096,1536,8,128,32,8,power_law_1.2,1.8275840759277344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,4096,1536,8,128,32,8,power_law_1.2,0.06058239936828613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,4096,1536,8,128,32,8,power_law_1.2,0.06940799951553345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,4096,1536,8,128,32,8,power_law_1.2,4.086470413208008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,4096,1536,8,128,32,8,power_law_1.2,0.0781823992729187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,4096,1536,8,128,32,8,power_law_1.2,0.08553599715232849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,4096,1536,8,128,32,8,power_law_1.2,0.11327999830245972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,4096,1536,8,128,32,8,power_law_1.2,0.13458559513092042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,4096,1536,8,128,32,8,power_law_1.2,0.19523839950561522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,4096,1536,8,128,32,8,power_law_1.2,0.21957759857177733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,4096,1536,8,128,32,8,power_law_1.2,0.31189119815826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,4096,1536,8,128,32,8,power_law_1.2,0.44202241897583006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,4096,1536,8,128,32,8,power_law_1.2,0.6837376117706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,4096,1536,8,128,32,8,power_law_1.2,0.8920255661010742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,4096,1536,8,128,32,8,power_law_1.2,1.0956543922424316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,4096,1536,8,128,32,8,power_law_1.2,1.8059839248657226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,4096,1536,8,128,32,8,power_law_1.2,4.296377563476563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,balanced,0.05087466537952423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,balanced,0.05163733164469401
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,balanced,0.052042668064435325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,balanced,0.0561653325955073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,balanced,0.07162666817506154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,balanced,0.07234133283297221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,balanced,0.07258133093516032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,balanced,0.07354133327802022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,balanced,0.07436800003051758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,balanced,0.046538665890693665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,balanced,0.07381333410739899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,balanced,0.04663999875386556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,balanced,0.07361066838105519
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,balanced,0.07425599793593089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,balanced,0.04663999875386556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,balanced,0.050341332952181496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,balanced,0.07450133562088013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,balanced,0.05415999889373779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,balanced,0.07496533294518788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,balanced,0.057071998715400696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,balanced,0.07762133578459422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,balanced,0.058362667759259544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,balanced,0.07842133442560832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,balanced,0.05904000004132589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,balanced,0.07947200040022533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,balanced,0.05936533212661743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,balanced,0.057258665561676025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,balanced,0.0869760016600291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,balanced,0.060090666015942894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,balanced,0.090037335952123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,balanced,0.061893333991368614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,balanced,0.10361066460609436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,balanced,0.06217066446940104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,balanced,0.06550933420658112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,balanced,0.10970667004585266
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,balanced,0.07017600039641063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,balanced,0.0728053351243337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,balanced,0.13265066345532736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,balanced,0.07645333309968312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,balanced,0.04151466737190882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,balanced,0.08711466193199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,balanced,0.04204800228277842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,balanced,0.15081066886583963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,balanced,0.04218666752179464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,balanced,0.09311999877293904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,balanced,0.04500266909599304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,balanced,0.11496000488599141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,balanced,0.04907733201980591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,balanced,0.050399998823801674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.01,0.07288320064544677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,balanced,0.19446400801340738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.01,0.061388802528381345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,balanced,0.052005335688591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,balanced,0.1253546675046285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.01,0.06791039705276489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.01,0.05400320291519165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,balanced,0.05250666538874308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.01,0.06342399716377259
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,balanced,0.052239999175071716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.01,0.04813440144062042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.01,0.07121279835700989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,balanced,0.15889066457748413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.01,0.06955519914627076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,balanced,0.05309866865475973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.01,0.0529151976108551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,balanced,0.2400053342183431
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.01,0.07157760262489318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,balanced,0.0554720014333725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.01,0.052262401580810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,balanced,0.18825600544611612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,balanced,0.05594133337338766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.01,0.07279360294342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.01,0.055776000022888184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.01,0.07643520236015319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,balanced,0.05729066828886668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.01,0.05745279788970947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.01,0.07927680015563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,balanced,0.060122668743133545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.01,0.057171201705932616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.01,0.07203840017318726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,balanced,0.25512532393137616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,balanced,0.0631573349237442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.01,0.07833600044250488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.01,0.05971840023994446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.01,0.07698559761047363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,balanced,0.32387733459472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.01,0.06037120223045349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.01,0.08174719810485839
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.01,0.06229119896888733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.01,0.08950399756431579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,balanced,0.06917333106199901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.01,0.09759359955787658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.01,0.06410880088806152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.01,0.08643839955329895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.01,0.06795520186424256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,balanced,0.3257333238919576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.01,0.1094208002090454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.01,0.0699072003364563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,balanced,0.07195200026035309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.01,0.11944320201873779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.01,0.0775168001651764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.01,0.15665919780731202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.01,0.08053759932518005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.01,0.1521407961845398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.01,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.01,0.2197567939758301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.01,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,balanced,0.40990400314331055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.01,0.28378241062164306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.01,0.12048640251159667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.01,0.3316927909851074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,balanced,0.07960533102353413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,balanced,0.4527680079142253
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.01,0.14442239999771117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.01,0.40456318855285645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.01,0.15367039442062377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,balanced,0.08796800176302592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.01,0.6244736194610596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.01,0.21123840808868408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.01,0.8978176116943359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.01,0.2502784013748169
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.01,0.9827520370483398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.01,0.365721607208252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.01,0.42801918983459475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.01,1.5033791542053223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.01,0.6615935802459717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,balanced,0.10294933120409648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.01,2.979827117919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,power_law_1.01,0.04857600033283234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.01,0.8605440139770508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,balanced,0.5771413246790568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,balanced,0.48236799240112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,balanced,0.11664533615112305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.01,1.2133312225341797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,power_law_1.01,0.045311999320983884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,power_law_1.01,0.042771199345588685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.01,1.7636159896850585
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,power_law_1.01,0.04859519898891449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.01,3.5964481353759767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,power_law_1.01,0.0487744003534317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,balanced,0.1498186687628428
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,power_law_1.01,0.051660799980163576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,power_law_1.01,0.05245440006256104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,balanced,0.17659733692804971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,power_law_1.01,0.05617280006408691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,8,32,power_law_1.2,0.07264639735221863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,balanced,0.7008266448974609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,power_law_1.01,0.05731199979782105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,8,32,power_law_1.2,0.06035839915275574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,power_law_1.01,0.060012799501419065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,8,32,power_law_1.2,0.05625600218772888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,power_law_1.01,0.06261759996414185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,power_law_1.01,0.06405119895935059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,8,32,power_law_1.2,0.061977601051330565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,balanced,0.23915199438730875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,power_law_1.01,0.06899840235710145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,8,32,power_law_1.2,0.06848000288009644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,balanced,0.7649760246276855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,power_law_1.01,0.07452800273895263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,8,32,power_law_1.2,0.069651198387146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,8,32,power_law_1.2,0.07104640007019043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,power_law_1.01,0.07971199750900268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,8,32,power_law_1.2,0.0720575988292694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,8,32,power_law_1.2,0.07868160009384155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,power_law_1.01,0.0911616027355194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,8,32,power_law_1.2,0.08012160062789916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,balanced,0.315226674079895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,8,32,power_law_1.2,0.07609599828720093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,power_law_1.01,0.09797760248184204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,8,32,power_law_1.2,0.07679359912872315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,8,32,power_law_1.2,0.07824640274047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,power_law_1.01,0.12035839557647705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,balanced,1.1065066655476887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,8,32,power_law_1.2,0.08499839901924133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,8,32,power_law_1.2,0.10089600086212158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,balanced,0.4476426839828491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,power_law_1.01,0.1549183964729309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,8,32,power_law_1.2,0.10264320373535156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,8,32,power_law_1.2,0.09293439984321594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,power_law_1.01,0.18976000547409058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,8,32,power_law_1.2,0.11699839830398559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,8,32,power_law_1.2,0.06384000182151794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,8,32,power_law_1.2,0.13216639757156373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,power_law_1.01,0.2533440113067627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,8,32,power_law_1.2,0.18434560298919678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,8,32,power_law_1.2,0.05002239942550659
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,power_law_1.01,0.33301119804382323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,8,32,power_law_1.2,0.1775871992111206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,8,32,power_law_1.2,0.04926080107688904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,8,32,power_law_1.2,0.05281919836997986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,8,32,power_law_1.2,0.24879999160766603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,power_law_1.01,0.4494463920593262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,8,32,power_law_1.2,0.054176002740859985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,8,32,power_law_1.2,0.28653440475463865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,8,32,power_law_1.2,0.054585599899291994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,power_law_1.01,0.6828415870666504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,balanced,0.5912799835205078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,8,32,power_law_1.2,0.05575680136680603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,power_law_1.01,0.9309823989868165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,8,32,power_law_1.2,0.51943039894104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,8,32,power_law_1.2,0.057043200731277464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,8,32,power_law_1.2,0.05982080101966858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,power_law_1.01,1.2072064399719238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,8,32,power_law_1.2,0.5793407917022705
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,8,32,power_law_1.2,0.06119040250778198
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,power_law_1.01,1.618783950805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,8,32,power_law_1.2,0.0627839982509613
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,8,32,power_law_1.2,0.8440896034240722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,8,32,power_law_1.2,0.06567680239677429
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,power_law_1.01,2.5433664321899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,balanced,1.4591946601867676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,8,32,power_law_1.2,1.1325056076049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,8,32,power_law_1.2,0.07040640115737914
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,power_law_1.01,5.35269775390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,8,32,power_law_1.2,0.07260800004005433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,8,32,power_law_1.2,1.3502207756042481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,balanced,0.7184586524963379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,8,32,power_law_1.2,0.082259202003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,8,32,power_law_1.2,0.09285119771957398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,8,32,power_law_1.2,2.3194559097290037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,8,32,power_law_1.2,0.08715519905090333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,8,32,power_law_1.2,0.10583679676055908
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,8,32,power_law_1.2,5.204601669311524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,8,32,power_law_1.2,0.1251711964607239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,balanced,2.204517364501953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,8,32,power_law_1.2,0.15771520137786865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,8,32,power_law_1.2,0.17847039699554443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,8,32,power_law_1.2,0.2617216110229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,8,32,power_law_1.2,0.29399681091308594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,8,32,power_law_1.2,0.43683199882507323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,8,32,power_law_1.2,0.548748779296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,8,32,power_law_1.2,0.8255871772766114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,8,32,power_law_1.2,1.1598272323608398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,balanced,1.1159199873606365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,8,32,power_law_1.2,1.3408960342407226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,8,32,power_law_1.2,2.446323204040527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,8,32,power_law_1.2,5.768390274047851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,balanced,0.0518453319867452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,balanced,0.05133866767088572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,balanced,0.052602668603261314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,balanced,0.05477866530418396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,8,32,power_law_1.2,0.04862079918384552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,balanced,0.07030933101971944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,balanced,0.07214400172233582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,balanced,2.197546641031901
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,8,32,power_law_1.2,0.04398080110549927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,balanced,0.07318399846553802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,8,32,power_law_1.2,0.04261119961738587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,balanced,0.07597866654396057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,8,32,power_law_1.2,0.04656639993190766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,balanced,0.07445333401362102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,balanced,0.0757120003302892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,8,32,power_law_1.2,0.04927360117435455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,balanced,0.07587199906508128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,8,32,power_law_1.2,0.05102720260620117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,balanced,0.07649066547552745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,balanced,0.07724800209204356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,8,32,power_law_1.2,0.05063040256500244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,balanced,0.07955733438332875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,8,32,power_law_1.2,0.052083200216293334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,balanced,0.08303466439247131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,8,32,power_law_1.2,0.05743359923362732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,balanced,0.08449600140253703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,8,32,power_law_1.2,0.058719998598098753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,balanced,0.08649067083994548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,8,32,power_law_1.2,0.06074240207672119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,balanced,0.10340799887975057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,8,32,power_law_1.2,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,balanced,0.09571199615796407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,8,32,power_law_1.2,0.06592640280723572
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,balanced,0.12623467048009238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,8,32,power_law_1.2,0.07015039920806884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,8,32,power_law_1.2,0.07890560030937195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,balanced,0.12095466256141663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,8,32,power_law_1.2,0.0858240008354187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,balanced,0.16562666495641074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,8,32,power_law_1.2,0.0920639991760254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,balanced,0.17867734034856161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,8,32,power_law_1.2,0.10632959604263306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,8,32,power_law_1.2,0.12247680425643921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,balanced,0.25387199719746906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,8,32,power_law_1.2,0.17758079767227172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,8,32,power_law_1.2,0.22167038917541504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,8,32,power_law_1.2,0.3382591962814331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,balanced,0.3057386676470439
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,8,32,power_law_1.2,0.3840895891189575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,8,32,power_law_1.2,0.5815104007720947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,balanced,0.046570668617884316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,8,32,power_law_1.2,0.9395839691162109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,balanced,0.0469706654548645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,balanced,0.43271466096242267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,8,32,power_law_1.2,1.1516032218933105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,balanced,0.04722133278846741
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,8,32,power_law_1.2,1.7964351654052735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,balanced,0.0533493310213089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,balanced,0.05698133508364359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,8,32,power_law_1.2,2.544211196899414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,balanced,0.058874666690826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,8,32,power_law_1.2,4.679891204833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,balanced,0.06065066655476888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.01,0.08206080198287964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,balanced,0.510042667388916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,8,32,power_law_1.2,8.814514923095704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,balanced,0.060736000537872314
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.01,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,balanced,0.060778667529424034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.01,0.05333120226860046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,balanced,0.06309866905212402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.01,0.06252800226211548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,balanced,0.06311999758084615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,balanced,0.04193066557248434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.01,0.06728960275650024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,balanced,0.06346666812896729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,balanced,0.042591998974482216
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.01,0.07067520022392274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.01,0.06175360083580017
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,balanced,0.06461333235104878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,balanced,0.04333333174387614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.01,0.0716543972492218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,balanced,0.04711466530958811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,balanced,0.06842666864395142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.01,0.06004480123519897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,balanced,0.050586665670077004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.01,0.075135999917984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,balanced,0.6031359831492106
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.01,0.04856959879398346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,balanced,0.07569600145022075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,balanced,0.055018668373425804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.01,0.07736960053443909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.01,0.05617920160293579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,balanced,0.07740800082683563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,balanced,0.05555200080076853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.01,0.07656959891319275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.01,0.05644800066947937
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,balanced,0.05552533268928528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,balanced,0.08081600069999695
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.01,0.0585919976234436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,balanced,0.057573333382606506
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.01,0.080595201253891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,balanced,0.09783466657002766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.01,0.05991680026054382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,balanced,0.05782933533191681
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.01,0.08036479949951172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.01,0.05983999967575073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,balanced,0.05900266766548157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,balanced,0.0990666647752126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,balanced,0.0609493354956309
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.01,0.06220800280570984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.01,0.0832319974899292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,power_law_1.01,0.0521664023399353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,balanced,0.12659200032552084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.01,0.06343039870262146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.01,0.08535680174827576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,balanced,0.06532800197601318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,power_law_1.01,0.05195519924163818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.01,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.01,0.08978559970855712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,power_law_1.01,0.04529280066490173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,balanced,0.13446399569511414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,balanced,0.0690719981988271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.01,0.0713536024093628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.01,0.09602559804916382
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,power_law_1.01,0.05134080052375793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.01,0.07255679965019227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,power_law_1.01,0.05233280062675476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.01,0.10207359790802002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,balanced,0.1827626625696818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.01,0.0732479989528656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,power_law_1.01,0.05622400045394897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,balanced,0.07473599910736084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,power_law_1.01,0.05678719878196716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.01,0.12110079526901245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.01,0.08108800053596496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,balanced,0.9698346455891927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,power_law_1.01,0.05793920159339905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.01,0.13646080493927001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.01,0.08391039967536926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,power_law_1.01,0.06058880090713501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,balanced,0.2135093410809835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,balanced,0.08040000001589458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,power_law_1.01,0.06212480068206787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.01,0.17662719488143921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.01,0.0916159987449646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,power_law_1.01,0.0652288019657135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.01,0.17511680126190185
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.01,0.10848000049591064
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,power_law_1.01,0.06640639901161194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,power_law_1.01,0.06952959895133973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.01,0.23909759521484375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.01,0.12157440185546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,balanced,0.29808000723520917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,power_law_1.01,0.07605119943618774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.01,0.2746495962142944
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.01,0.15444480180740355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,power_law_1.01,0.08618239760398864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,balanced,0.0904906690120697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.01,0.38458240032196045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.01,0.1729151964187622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,balanced,0.10042666395505269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,power_law_1.01,0.08859519958496094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.01,0.22811520099639893
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.01,0.4541312217712402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.01,0.2781440019607544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,balanced,0.3734560012817383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,power_law_1.01,0.0944703996181488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.01,0.663040018081665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.01,0.38042240142822265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.01,0.7711103916168213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.01,0.5253312110900878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,power_law_1.01,0.11637760400772094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,balanced,0.12133333086967468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.01,1.0432703971862793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,power_law_1.01,0.12670079469680787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.01,0.7718912124633789
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,16,16,power_law_1.2,0.0812991976737976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.01,1.575603199005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,balanced,0.14009066422780356
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,16,16,power_law_1.2,0.05858560204505921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.01,0.9533247947692871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,balanced,0.5449066559473673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,16,16,power_law_1.2,0.05303679704666138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,power_law_1.01,0.17333760261535644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.01,1.1828672409057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.01,3.133535957336426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,16,16,power_law_1.2,0.05848960280418396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,power_law_1.01,0.23418879508972168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.01,1.8206527709960938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,16,16,power_law_1.2,0.06564480066299438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,balanced,0.19133333365122476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,power_law_1.01,0.32515199184417726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,16,16,power_law_1.2,0.07010560035705567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,power_law_1.01,0.3937599897384644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.01,3.9907711029052733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,16,16,power_law_1.2,0.07185919880867005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,16,16,power_law_1.2,0.07427840232849121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,balanced,0.24380266666412354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,16,16,power_law_1.2,0.07671040296554565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,power_law_1.01,0.5781568050384521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,balanced,0.66866135597229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,16,16,power_law_1.2,0.0753920018672943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,power_law_1.01,0.7542719841003418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,16,16,power_law_1.2,0.07963520288467407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,balanced,0.3474613428115845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,16,16,power_law_1.2,0.0843775987625122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,16,16,power_law_1.2,0.0837119996547699
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,power_law_1.01,1.1444607734680177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,balanced,1.8736534118652344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,16,16,power_law_1.2,0.08872320055961609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,power_law_1.01,1.6009792327880858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,16,16,power_law_1.2,0.09326720237731934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,balanced,0.4468160072962443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,power_law_1.01,1.9633920669555665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,16,16,power_law_1.2,0.09516159892082214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,16,16,power_law_1.2,0.10891519784927368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,power_law_1.01,3.2927616119384764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,balanced,0.8167146841684977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,16,16,power_law_1.2,0.14154239892959594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,16,16,power_law_1.2,0.1468160033226013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,power_law_1.01,6.162432098388672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,16,16,power_law_1.2,0.1941248059272766
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,16,16,power_law_1.2,0.1956287980079651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,16,16,power_law_1.2,0.2855423927307129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,balanced,0.6414026816685995
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,16,16,power_law_1.2,0.28631041049957273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,16,16,power_law_1.2,0.4448703765869141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,16,16,power_law_1.2,0.5131392002105712
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,16,16,power_law_1.2,0.9323200225830078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,16,16,power_law_1.2,1.0686335563659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,16,16,power_law_1.2,1.4573760032653809
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,balanced,0.8295520146687826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,16,16,power_law_1.2,2.475289535522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,balanced,1.2980159918467205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,16,16,power_law_1.2,5.880031967163086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,balanced,1.0092106660207112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,16,16,power_law_1.2,0.06160640120506287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,16,16,power_law_1.2,0.04940800070762634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,16,16,power_law_1.2,0.048390400409698484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,16,16,power_law_1.2,0.05541120171546936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,16,16,power_law_1.2,0.05494400262832642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,16,16,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,16,16,power_law_1.2,0.06033279895782471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,16,16,power_law_1.2,0.0611840009689331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,balanced,1.588538646697998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,16,16,power_law_1.2,0.0636031985282898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,16,16,power_law_1.2,0.06550400257110596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,16,16,power_law_1.2,0.0666815996170044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,16,16,power_law_1.2,0.07125120162963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,16,16,power_law_1.2,0.07438719868659974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,16,16,power_law_1.2,0.07579519748687744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,16,16,power_law_1.2,0.07922559976577759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,balanced,2.559109369913737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,16,16,power_law_1.2,0.08514559864997864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,16,16,power_law_1.2,0.0955136001110077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,16,16,power_law_1.2,0.1123136043548584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,16,16,power_law_1.2,0.13271039724349976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,16,16,power_law_1.2,0.16682239770889282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,16,16,power_law_1.2,0.18933119773864746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,16,16,power_law_1.2,0.24683520793914795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,16,16,power_law_1.2,0.312556791305542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,16,16,power_law_1.2,0.4551231861114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,16,16,power_law_1.2,0.5853439807891846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,16,16,power_law_1.2,0.8493760108947754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,16,16,power_law_1.2,1.1415103912353515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,16,16,power_law_1.2,1.4732416152954102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,16,16,power_law_1.2,2.306713676452637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,16,16,power_law_1.2,5.1799358367919925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,balanced,3.1508267720540366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,balanced,0.05249066650867462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,balanced,0.052239999175071716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,balanced,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,balanced,0.0569706658522288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,6144,2560,8,160,16,16,power_law_1.2,0.05200639963150024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,balanced,0.0737120012442271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,balanced,0.07810133198897044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,6144,2560,8,160,16,16,power_law_1.2,0.04437119960784912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,balanced,0.07844799757003784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,6144,2560,8,160,16,16,power_law_1.2,0.0451200008392334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,balanced,0.04668800036112467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,balanced,0.08012799918651581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,6144,2560,8,160,16,16,power_law_1.2,0.04785279929637909
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,balanced,0.08004799981911977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,balanced,0.04719999929269155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,6144,2560,8,160,16,16,power_law_1.2,0.050496000051498416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,balanced,0.08032000064849854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,balanced,0.04907733201980591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,6144,2560,8,160,16,16,power_law_1.2,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,balanced,0.08111999928951263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,6144,2560,8,160,16,16,power_law_1.2,0.05761280059814453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,balanced,0.05317866802215576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,6144,2560,8,160,16,16,power_law_1.2,0.059545600414276124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,balanced,0.0817493349313736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,balanced,0.06091199815273285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,6144,2560,8,160,16,16,power_law_1.2,0.06144639849662781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,balanced,0.08206933240095775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,balanced,0.06358399987220764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,6144,2560,8,160,16,16,power_law_1.2,0.061868798732757566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,6144,2560,8,160,16,16,power_law_1.2,0.066457599401474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,balanced,0.06505066653092702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,balanced,0.08377599716186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,6144,2560,8,160,16,16,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,balanced,0.06568000217278798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,balanced,0.08820799986521403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,6144,2560,8,160,16,16,power_law_1.2,0.07604479789733887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,balanced,0.06596800188223521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,balanced,0.0955466628074646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,6144,2560,8,160,16,16,power_law_1.2,0.07731840014457703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,balanced,0.06596266726652782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,6144,2560,8,160,16,16,power_law_1.2,0.08592640161514283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,balanced,0.0944640040397644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,balanced,0.06748266518115997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,balanced,0.11627200245857239
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,6144,2560,8,160,16,16,power_law_1.2,0.09637119770050048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,balanced,0.06746133168538411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,balanced,0.07004266480604808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,balanced,0.11530133088429768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,6144,2560,8,160,16,16,power_law_1.2,0.10206719636917114
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,balanced,0.07438399891058604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,balanced,0.13402666648228964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,balanced,0.08348266283671062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.01,0.060198402404785155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,balanced,0.08565333485603333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,6144,2560,8,160,16,16,power_law_1.2,0.12025599479675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.01,0.07011839747428894
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,balanced,0.14727999766667685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,balanced,0.09191999832789104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.01,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,6144,2560,8,160,16,16,power_law_1.2,0.14193919897079468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,balanced,0.1127306620279948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.01,0.06294400095939637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,balanced,0.22217599550882974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.01,0.06711680293083191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,balanced,0.11505599816640218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.01,0.077292799949646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,6144,2560,8,160,16,16,power_law_1.2,0.20067839622497557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,balanced,0.1381706694761912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,balanced,0.2386666735013326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.01,0.07899519801139832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,6144,2560,8,160,16,16,power_law_1.2,0.2639935970306396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.01,0.07639679908752442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,balanced,0.15692800283432007
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,6144,2560,8,160,16,16,power_law_1.2,0.3245055913925171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.01,0.0771776020526886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,balanced,0.3444960117340088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.01,0.0807424008846283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,6144,2560,8,160,16,16,power_law_1.2,0.4525887966156006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,balanced,0.22838934262593588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.01,0.08270080089569092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.01,0.08661119937896729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,6144,2560,8,160,16,16,power_law_1.2,0.6668032169342041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,balanced,0.2678826649983724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.01,0.09007359743118286
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,6144,2560,8,160,16,16,power_law_1.2,0.858739185333252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,balanced,0.4187626838684082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.01,0.09382399916648865
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.01,0.10011520385742187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,6144,2560,8,160,16,16,power_law_1.2,1.3046272277832032
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,balanced,0.3853600025177002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.01,0.10584959983825684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,6144,2560,8,160,16,16,power_law_1.2,1.8203264236450196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.01,0.1080896019935608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.01,0.12695679664611817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,6144,2560,8,160,16,16,power_law_1.2,2.8370304107666016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.01,0.1331071972846985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,balanced,0.5846720139185587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,balanced,0.48813335100809735
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.01,0.15486719608306884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,6144,2560,8,160,16,16,power_law_1.2,4.392524719238281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.01,0.20527360439300538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.01,0.2633599996566772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,6144,2560,8,160,16,16,power_law_1.2,8.947853088378906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.01,0.31245439052581786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.01,0.43509759902954104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.01,0.5960319995880127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,balanced,0.6954293251037598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.01,0.828115177154541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,balanced,0.7337013085683187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.01,1.0116352081298827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.01,1.2495807647705077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.01,0.052262401580810545
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.01,2.191654396057129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.01,0.059654402732849124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.01,0.05011839866638183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.01,3.7607872009277346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,balanced,0.8776799837748209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.01,0.05382400155067444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.01,0.05622400045394897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.01,0.06375679969787598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.01,0.06473600268363952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,balanced,0.8866079648335775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.01,0.06618239879608154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.01,0.06691840291023254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.01,0.06838399767875672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.01,0.07291520237922669
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,balanced,1.0827893416086833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.01,0.07485439777374267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.01,0.08190720081329346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.01,0.08147199749946595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.01,0.08930559754371643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,6144,2560,8,160,32,8,power_law_1.2,0.0597055971622467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.01,0.09227520227432251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,6144,2560,8,160,32,8,power_law_1.2,0.05261440277099609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.01,0.10299520492553711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,6144,2560,8,160,32,8,power_law_1.2,0.05545600056648255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.01,0.11975040435791015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,6144,2560,8,160,32,8,power_law_1.2,0.060172802209854125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,balanced,1.3976426124572754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,6144,2560,8,160,32,8,power_law_1.2,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,6144,2560,8,160,32,8,power_law_1.2,0.07444480061531067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.01,0.13192319869995117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,6144,2560,8,160,32,8,power_law_1.2,0.0785215973854065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.01,0.15946880578994752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,6144,2560,8,160,32,8,power_law_1.2,0.07585920095443725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,6144,2560,8,160,32,8,power_law_1.2,0.07957119941711426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.01,0.19701119661331176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,6144,2560,8,160,32,8,power_law_1.2,0.07992320060729981
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.01,0.25430400371551515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,6144,2560,8,160,32,8,power_law_1.2,0.08376960158348083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,balanced,1.6802773475646973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,6144,2560,8,160,32,8,power_law_1.2,0.08562560081481933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.01,0.31322879791259767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,6144,2560,8,160,32,8,power_law_1.2,0.09271039962768554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.01,0.45166721343994143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,6144,2560,8,160,32,8,power_law_1.2,0.0923583984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.01,0.5577600002288818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,6144,2560,8,160,32,8,power_law_1.2,0.1045632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,6144,2560,8,160,32,8,power_law_1.2,0.10894720554351807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.01,0.8757951736450196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,6144,2560,8,160,32,8,power_law_1.2,0.1091264009475708
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.01,1.2334976196289062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,6144,2560,8,160,32,8,power_law_1.2,0.13779840469360352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.01,1.4633407592773438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,6144,2560,8,160,32,8,power_law_1.2,0.1362496018409729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,6144,2560,8,160,32,8,power_law_1.2,0.1751423954963684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.01,2.2188159942626955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,6144,2560,8,160,32,8,power_law_1.2,0.22593278884887696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,6144,2560,8,160,32,8,power_law_1.2,0.288044810295105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.01,5.1084545135498045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,6144,2560,8,160,32,8,power_law_1.2,0.3669696092605591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,6144,2560,8,160,32,8,power_law_1.2,0.46935038566589354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,6144,2560,8,160,32,8,power_law_1.2,0.6716224193572998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,6144,2560,8,160,32,8,power_law_1.2,0.9790911674499512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,6144,2560,8,160,32,8,power_law_1.2,1.2805248260498048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,6144,2560,8,160,32,8,power_law_1.2,1.436742401123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,6144,2560,8,160,32,8,power_law_1.2,2.3253055572509767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,power_law_1.2,5.533260726928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,6144,2560,8,160,32,8,balanced,2.72217591603597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,balanced,3.3702828089396157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,6144,2560,8,160,32,8,power_law_1.2,0.05004159808158874
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,6144,2560,8,160,32,8,power_law_1.2,0.04863359928131104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,6144,2560,8,160,32,8,power_law_1.2,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,6144,2560,8,160,32,8,power_law_1.2,0.05240960121154785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,6144,2560,8,160,32,8,power_law_1.2,0.05422719717025757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,6144,2560,8,160,32,8,power_law_1.2,0.05927680134773254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,6144,2560,8,160,32,8,power_law_1.2,0.06111360192298889
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,6144,2560,8,160,32,8,power_law_1.2,0.06223999857902527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,6144,2560,8,160,32,8,power_law_1.2,0.06431999802589417
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,6144,2560,8,160,32,8,power_law_1.2,0.06618880033493042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,6144,2560,8,160,32,8,power_law_1.2,0.06982399821281433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,6144,2560,8,160,32,8,power_law_1.2,0.07489280104637146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,6144,2560,8,160,32,8,power_law_1.2,0.07913600206375122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,6144,2560,8,160,32,8,power_law_1.2,0.0791167974472046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,6144,2560,8,160,32,8,power_law_1.2,0.08783360123634339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,6144,2560,8,160,32,8,power_law_1.2,0.09376639723777772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,6144,2560,8,160,32,8,power_law_1.2,0.1045632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,6144,2560,8,160,32,8,power_law_1.2,0.12646399736404418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,6144,2560,8,160,32,8,power_law_1.2,0.12957439422607422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,balanced,0.11928533514340718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,6144,2560,8,160,32,8,power_law_1.2,0.16563839912414552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,balanced,0.11401066184043884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,balanced,0.11788800358772278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,6144,2560,8,160,32,8,power_law_1.2,0.2125312089920044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,balanced,0.12033599615097046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,6144,2560,8,160,32,8,power_law_1.2,0.293939208984375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,balanced,0.12033599615097046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,balanced,0.20196266969045004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,6144,2560,8,160,32,8,power_law_1.2,0.3399104118347168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,balanced,0.28246400753657025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,6144,2560,8,160,32,8,power_law_1.2,0.5052480220794677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,balanced,0.28180267413457233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,6144,2560,8,160,32,8,power_law_1.2,0.6717631816864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,balanced,0.2893173297246297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,balanced,0.28325867652893066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,6144,2560,8,160,32,8,power_law_1.2,1.0159040451049806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,balanced,0.2831520040829976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,balanced,0.26523733139038086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,6144,2560,8,160,32,8,power_law_1.2,1.4514816284179688
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,balanced,0.2800160050392151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,balanced,0.27525333563486737
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,6144,2560,8,160,32,8,power_law_1.2,1.9161407470703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,balanced,0.27612799406051636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,6144,2560,8,160,32,8,power_law_1.2,2.685536003112793
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,balanced,0.28279467423756915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,balanced,0.28773866097132367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,6144,2560,8,160,32,8,power_law_1.2,6.007545471191406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,balanced,0.2770986755688985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,balanced,0.29097600777943927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,balanced,0.30060799916585285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,balanced,0.31062400341033936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,balanced,0.317466676235199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,balanced,0.077674667040507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,balanced,0.31996800502141315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,balanced,0.07913066446781158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,balanced,0.0795306662718455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,balanced,0.08011733492215474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,balanced,0.08181866506735484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,balanced,0.3232373396555583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,balanced,0.13109333316485086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,balanced,0.16925867398579916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,balanced,0.16914665699005127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,balanced,0.16550399859746298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,balanced,0.17174400885899863
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,balanced,0.17363200585047403
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,balanced,0.5967093308766683
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,balanced,0.18460800250371298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,balanced,0.18134933710098267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,balanced,0.1810879906018575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,balanced,0.17981332540512085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,balanced,0.17681066195170084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,balanced,0.19210133949915567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,balanced,0.58897598584493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,balanced,0.046223998069763184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,balanced,0.19298666715621948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,balanced,0.2034026583035787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,balanced,0.046682665745417275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,balanced,0.21741332610448202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,balanced,0.04665066798528036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,balanced,0.04885333279768626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,balanced,0.24637866020202637
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.01,0.17494399547576905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.01,0.27005441188812257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,balanced,0.04986133178075155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.01,0.16219520568847656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,balanced,0.06233599781990051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.01,0.27672319412231444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,balanced,0.2746453285217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,balanced,0.8900213241577148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,balanced,0.06943466762701671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.01,0.17167359590530396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.01,0.27125120162963867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,balanced,0.07026133437951405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,balanced,0.3094346721967061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.01,0.1382464051246643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.01,0.1942720055580139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,balanced,0.07005866865317027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,balanced,0.07046933472156525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.01,0.16406400203704835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.01,0.24654719829559327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,balanced,0.07155733307202657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.01,0.15219839811325073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.01,0.2468928098678589
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,balanced,0.3626399834950765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,balanced,0.07293866574764252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.01,0.14266879558563234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.01,0.2612799882888794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,balanced,0.07420800129572551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.01,0.145632004737854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.01,0.24503679275512696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,balanced,0.07504533231258392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,power_law_1.01,0.06599040031433105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.01,0.16858240365982055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.01,0.27112319469451907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,balanced,1.14573868115743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,balanced,0.08246933420499165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,balanced,0.5533546606699625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,power_law_1.01,0.06214399933815003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.01,0.17568000555038452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.01,0.27409920692443845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,balanced,0.08241066833337148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,power_law_1.01,0.06039040088653565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.01,0.26379520893096925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.01,0.17722879648208617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,balanced,0.08711466193199158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,power_law_1.01,0.05811200141906738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.01,0.2393280029296875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.01,0.161900794506073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,balanced,0.09591999650001526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.01,0.2687488079071045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,power_law_1.01,0.06302080154418946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.01,0.16544640064239502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,balanced,0.6650506655375162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.01,0.2699968099594116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,power_law_1.01,0.06600319743156433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.01,0.16940159797668458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.01,0.2518784046173096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,balanced,0.10659199953079224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,power_law_1.01,0.06490880250930786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.01,0.1627519965171814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.01,0.24899840354919434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,power_law_1.01,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.01,0.16327680349349977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.01,0.25966720581054686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,power_law_1.01,0.06899200081825256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.01,0.17429120540618898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.01,0.2347520112991333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,power_law_1.01,0.06748800277709961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.01,0.17791999578475953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.01,0.26277120113372804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,power_law_1.01,0.07146880030632019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,balanced,0.9266239802042643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.01,0.19347840547561646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.01,0.3518847942352295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,balanced,0.12307733297348022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,power_law_1.01,0.07116159796714783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,balanced,1.687503973642985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.01,0.22644479274749757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.01,0.41653761863708494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,power_law_1.01,0.07574399709701538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,balanced,0.13902933398882547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.01,0.3093951940536499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.01,0.5625472068786621
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,power_law_1.01,0.07785599827766418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.01,0.3961407899856567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.01,0.6553984165191651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,balanced,0.16925867398579916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.01,0.9009984016418457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.01,0.4435455799102783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,power_law_1.01,0.08377599716186523
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.01,1.025068759918213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.01,0.649894380569458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,power_law_1.01,0.0870464026927948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.01,1.7299903869628905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.01,0.8500415802001953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,power_law_1.01,0.09715840220451355
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,balanced,1.172271966934204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.01,2.411347198486328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.01,1.2618176460266113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,power_law_1.01,0.115065598487854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.01,2.9074047088623045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.01,1.5990655899047852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,balanced,0.20266666014989218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,power_law_1.01,0.1366912007331848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.01,5.117529678344726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.01,2.156185531616211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.01,3.1826623916625976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.01,9.832326507568359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,balanced,0.26069867610931396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,power_law_1.01,0.15461119413375854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.01,6.219635009765625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,2,128,power_law_1.2,0.27431039810180663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,power_law_1.01,0.1921023964881897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,power_law_1.01,0.2554879903793335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,2,128,power_law_1.2,0.2747136116027832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,2,128,power_law_1.2,0.2610111951828003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,balanced,1.8061493237813313
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,2,128,power_law_1.2,0.21242880821228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,power_law_1.01,0.302892804145813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,2,128,power_law_1.2,0.22525439262390137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,power_law_1.01,0.44618239402771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,balanced,0.3307146628697713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,2,128,power_law_1.2,0.27577600479125974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,2,128,power_law_1.2,0.22521600723266602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,2,128,power_law_1.2,0.17371519804000854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,power_law_1.01,0.5681471824645996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,balanced,3.1059306462605796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,2,128,power_law_1.2,0.28129920959472654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,2,128,power_law_1.2,0.1678015947341919
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,power_law_1.01,0.7787839889526367
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,2,128,power_law_1.2,0.26320641040802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,2,128,power_law_1.2,0.17020800113677978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,balanced,0.45402665932973224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,2,128,power_law_1.2,0.22495360374450685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,2,128,power_law_1.2,0.11969280242919922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,2,128,power_law_1.2,0.24309759140014647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,power_law_1.01,1.1384832382202148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,2,128,power_law_1.2,0.12654080390930175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,2,128,power_law_1.2,0.1376960039138794
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,2,128,power_law_1.2,0.24296960830688477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,power_law_1.01,1.4780159950256349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,2,128,power_law_1.2,0.1518399953842163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,2,128,power_law_1.2,0.2755903959274292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,2,128,power_law_1.2,0.15708160400390625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,power_law_1.01,2.166156768798828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,2,128,power_law_1.2,0.22189440727233886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,2,128,power_law_1.2,0.1533568024635315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,2,128,power_law_1.2,0.24705278873443604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,power_law_1.01,4.23955192565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,2,128,power_law_1.2,0.16265599727630614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,2,128,power_law_1.2,0.22831358909606933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,balanced,0.5963040192921957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,2,128,power_law_1.2,0.17134720087051392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,2,128,power_law_1.2,0.23681919574737548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,2,128,power_law_1.2,0.15980160236358643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,2,128,power_law_1.2,0.2661247968673706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,2,128,power_law_1.2,0.15978879928588868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,2,128,power_law_1.2,0.15044480562210083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,2,128,power_law_1.2,0.341977596282959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,2,128,power_law_1.2,0.1753983974456787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,2,128,power_law_1.2,0.1733247995376587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,2,128,power_law_1.2,0.40621438026428225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,2,128,power_law_1.2,0.17241599559783935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,2,128,power_law_1.2,0.5180416107177734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,2,128,power_law_1.2,0.1718783974647522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,balanced,3.444373448689779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,2,128,power_law_1.2,0.6042687892913818
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,2,128,power_law_1.2,0.2144767999649048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,balanced,0.7376159826914469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,2,128,power_law_1.2,0.26528639793395997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,2,128,power_law_1.2,0.9272959709167481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,2,128,power_law_1.2,0.3377088069915771
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,2,128,power_law_1.2,1.2131199836730957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,2,128,power_law_1.2,0.4383232116699219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,2,128,power_law_1.2,1.7638847351074218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,2,128,power_law_1.2,0.5850624084472656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,2,128,power_law_1.2,2.7769535064697264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,2,128,power_law_1.2,0.933471965789795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,2,128,power_law_1.2,3.9547840118408204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,2,128,power_law_1.2,1.1447104454040526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,2,128,power_law_1.2,4.472684860229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,2,128,power_law_1.2,1.4790271759033202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,2,128,power_law_1.2,2.392767906188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,2,128,power_law_1.2,7.020864105224609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,2,128,power_law_1.2,2.8575872421264648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,balanced,1.1485599676767986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,2,128,power_law_1.2,15.397804260253906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,2,128,power_law_1.2,5.935321426391601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,2,128,power_law_1.2,9.929920196533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,balanced,2.2643359502156577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,2,128,power_law_1.2,0.06273279786109924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,2,128,power_law_1.2,0.06267520189285278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,2,128,power_law_1.2,0.061273598670959474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,2,128,power_law_1.2,0.05924479961395264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,balanced,0.0832479993502299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,2,128,power_law_1.2,0.06043519973754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,2,128,power_law_1.2,0.06507520079612732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,balanced,0.0817440003156662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,2,128,power_law_1.2,0.06416000127792358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,balanced,0.08255466818809509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,2,128,power_law_1.2,0.06770560145378113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,balanced,0.0863200028737386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,2,128,power_law_1.2,0.06658560037612915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,balanced,0.11460266510645549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,balanced,0.19402666886647543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,2,128,power_law_1.2,0.06910719871520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,balanced,0.27453867594401044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,2,128,power_law_1.2,0.07281919717788696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,balanced,0.0692853331565857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,balanced,0.2858026623725891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,2,128,power_law_1.2,0.07208319902420043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,balanced,0.06911999980608623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,balanced,0.29029866059621173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,2,128,power_law_1.2,0.07126399874687195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,balanced,0.07075733443101247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,balanced,0.28252265850702923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,balanced,0.07114666700363159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,2,128,power_law_1.2,0.07956479787826538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,balanced,0.27983999252319336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,balanced,0.08202666540940602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,2,128,power_law_1.2,0.08568959832191467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,balanced,0.13132799665133157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,balanced,0.2800266742706299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,2,128,power_law_1.2,0.09296000003814697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,balanced,0.16921599706013998
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,balanced,0.304362674554189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,2,128,power_law_1.2,0.10440319776535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,balanced,0.1851039926211039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,balanced,0.29070399204889935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,2,128,power_law_1.2,0.12905600070953369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,balanced,0.1722559928894043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,balanced,0.27294933795928955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,balanced,0.1777120033899943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,2,128,power_law_1.2,0.16417280435562134
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,balanced,0.2936906615893046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,balanced,0.186191995938619
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,balanced,0.2929226756095886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,balanced,0.17112533251444498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,balanced,0.18774400154749551
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,2,128,power_law_1.2,0.18202879428863525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,balanced,0.27748799324035645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,balanced,0.18127467234929404
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,2,128,power_law_1.2,0.21564159393310547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,balanced,0.2884426712989807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,balanced,0.16918933391571045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,2,128,power_law_1.2,0.3156928062438965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,balanced,0.17282134294509888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,balanced,0.29231999317804974
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,balanced,0.18105065822601318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,2,128,power_law_1.2,0.396780800819397
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,balanced,0.3036800026893616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,balanced,0.19530133406321207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,2,128,power_law_1.2,0.5868095874786377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,balanced,0.20361065864562988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,balanced,0.04518933097521464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.01,0.2594111919403076
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,balanced,0.32685865958531696
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,balanced,0.045850664377212524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,balanced,0.225983997186025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.01,0.2668864011764526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,2,128,power_law_1.2,0.7417088031768799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.01,0.28192639350891113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,balanced,0.047872001926104225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,balanced,0.32939199606577557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.01,0.14675840139389038
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,balanced,0.25334399938583374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,2,128,power_law_1.2,1.1316224098205567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,balanced,0.05005866785844167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.01,0.18676480054855346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,balanced,0.06329066554705302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.01,0.20366079807281495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,balanced,0.0690719981988271
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,balanced,0.28248000144958496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,2,128,power_law_1.2,1.4950336456298827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.01,0.24542720317840577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,balanced,0.06940266489982605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,balanced,0.33956801891326904
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.01,0.24046719074249268
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,balanced,0.07028266787528992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,2,128,power_law_1.2,1.8967296600341796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.01,0.23928320407867432
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,balanced,0.07010666529337566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,balanced,0.31329067548116046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.01,0.25423359870910645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,balanced,0.0718560020128886
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,2,128,power_law_1.2,3.382252883911133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.01,0.22880001068115235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,balanced,0.07397866745789845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.01,0.2364288091659546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,balanced,0.6351840098698934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,balanced,0.0746559997399648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.01,0.2652224063873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,2,128,power_law_1.2,6.814195251464843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,balanced,0.3757866621017456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,balanced,0.07598400115966797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.01,0.25971839427947996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,balanced,0.08294933537642162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.01,0.24220800399780273
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.01,0.2504703998565674
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,balanced,0.08348266283671062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.01,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,balanced,0.08890666564305623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.01,0.27002880573272703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,balanced,0.5898826519648234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.01,0.1654144048690796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,balanced,0.09752000371615092
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.01,0.30845439434051514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,balanced,0.6188053290049235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.01,0.16970239877700805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.01,0.3588223934173584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.01,0.3791743993759155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.01,0.16970880031585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,balanced,0.1074186662832896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.01,0.5109824180603028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.01,0.10748800039291381
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.01,0.5844992160797119
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.01,0.12380160093307495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,power_law_1.01,0.07009919881820678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.01,0.8671487808227539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,balanced,0.6942880153656006
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.01,0.1201856017112732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.01,1.0253631591796875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,power_law_1.01,0.06387839913368225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.01,0.14479360580444336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,balanced,0.9185333251953125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,power_law_1.01,0.06335359811782837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.01,1.5062335968017577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.01,0.1617535948753357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,balanced,0.12711999813715616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,power_law_1.01,0.05493119955062866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.01,1.9830976486206056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.01,0.15427839756011963
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,power_law_1.01,0.05790079832077026
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,balanced,0.1455573340257009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.01,0.1674880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,power_law_1.01,0.061926400661468504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.01,2.2083391189575194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.01,0.16729600429534913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,power_law_1.01,0.06428160071372986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,balanced,0.17654933532079062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.01,0.1525823950767517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,balanced,0.9626560211181641
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.01,3.476095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,power_law_1.01,0.06672000288963317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.01,0.147980797290802
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,power_law_1.01,0.06781439781188965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.01,0.16230399608612062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,power_law_1.01,0.06887680292129517
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.01,7.171961975097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.01,0.17374080419540405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,power_law_1.01,0.07203840017318726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.01,0.18439040184020997
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,balanced,1.2356639703114827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,power_law_1.01,0.07431679964065552
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.01,0.17369600534439086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,power_law_1.01,0.0753920018672943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.01,0.17816319465637206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,balanced,0.21424533923467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,power_law_1.01,0.07919999957084656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.01,0.19510400295257568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,power_law_1.01,0.08579840064048767
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.01,0.24254720211029052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,4,64,power_law_1.2,0.29802238941192627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,power_law_1.01,0.0870848000049591
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,balanced,1.2468799750010173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.01,0.2847104072570801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,balanced,0.27658132712046307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,4,64,power_law_1.2,0.29190399646759035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,power_law_1.01,0.09779199957847595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.01,0.37995519638061526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,power_law_1.01,0.1128383994102478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,4,64,power_law_1.2,0.2812288045883179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.01,0.425113582611084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,4,64,power_law_1.2,0.17077759504318238
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.01,0.5770624160766602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,power_law_1.01,0.13177599906921386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,4,64,power_law_1.2,0.19385600090026855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.01,0.7719935894012451
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,4,64,power_law_1.2,0.22071681022644044
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.01,1.1935487747192384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,4,64,power_law_1.2,0.2128511905670166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,power_law_1.01,0.16197760105133058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,balanced,0.3575040102005005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,4,64,power_law_1.2,0.24717440605163574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,power_law_1.01,0.18284800052642822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.01,1.4777791976928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,balanced,1.840511957804362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,4,64,power_law_1.2,0.23269760608673096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,power_law_1.01,0.25089919567108154
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.01,2.0241535186767576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,4,64,power_law_1.2,0.25677440166473386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,4,64,power_law_1.2,0.2690752029418945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.01,2.9470848083496093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,power_law_1.01,0.3306368112564087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,4,64,power_law_1.2,0.24174718856811522
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,balanced,0.4992106755574544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,power_law_1.01,0.4817344188690186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,4,64,power_law_1.2,0.2730304002761841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.01,5.855526351928711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,balanced,1.9000585873921711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,4,64,power_law_1.2,0.2694272041320801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,power_law_1.01,0.5665535926818848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,4,64,power_law_1.2,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,power_law_1.01,0.8564672470092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,4,64,power_law_1.2,0.2509887933731079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,4,64,power_law_1.2,0.2496256113052368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,4,64,power_law_1.2,0.2963583946228027
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,power_law_1.01,1.1164863586425782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,4,64,power_law_1.2,0.31308159828186033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,balanced,0.6736319859822592
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,4,64,power_law_1.2,0.35890560150146483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,4,64,power_law_1.2,0.44374399185180663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,power_law_1.01,1.375539207458496
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,4,64,power_law_1.2,0.574617576599121
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,power_law_1.01,2.3522111892700197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,4,64,power_law_1.2,0.8195520401000976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,4,64,power_law_1.2,1.0124992370605468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,power_law_1.01,4.6154624938964846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,4,64,power_law_1.2,1.3696831703186034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,4,64,power_law_1.2,2.1137664794921873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,balanced,0.8305919965108236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,4,64,power_law_1.2,2.6633279800415037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,4,64,power_law_1.2,3.3095169067382812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,4,64,power_law_1.2,4.76110725402832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,balanced,3.3107999165852866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,4,64,power_law_1.2,11.973868560791015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,balanced,3.619584083557129
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,balanced,1.2949706713358562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,4,64,power_law_1.2,0.1673408031463623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,4,64,power_law_1.2,0.1625983953475952
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,4,64,power_law_1.2,0.1676095962524414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,4,64,power_law_1.2,0.10947840213775635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,4,64,power_law_1.2,0.1240447998046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,4,64,power_law_1.2,0.1180351972579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,4,64,power_law_1.2,0.13539199829101561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,4,64,power_law_1.2,0.1566975951194763
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,4,64,power_law_1.2,0.15152000188827514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,4,64,power_law_1.2,0.14088959693908693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,4,64,power_law_1.2,0.15559680461883546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,4,64,power_law_1.2,0.16306560039520263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,4,64,power_law_1.2,0.16349439620971679
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,4,64,power_law_1.2,0.16284799575805664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,4,64,power_law_1.2,0.16558079719543456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,4,64,power_law_1.2,0.18099839687347413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,4,64,power_law_1.2,0.15255680084228515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,4,64,power_law_1.2,0.2019263982772827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,balanced,2.5295093854268393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,4,64,power_law_1.2,0.22614400386810302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,4,64,power_law_1.2,0.26997759342193606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,4,64,power_law_1.2,0.3151808023452759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,4,64,power_law_1.2,0.42989439964294435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,4,64,power_law_1.2,0.5234496116638183
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,4,64,power_law_1.2,0.684665584564209
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,4,64,power_law_1.2,1.0033920288085938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,4,64,power_law_1.2,0.06653439998626709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,4,64,power_law_1.2,1.44901123046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,4,64,power_law_1.2,0.06316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,4,64,power_law_1.2,0.06053760051727295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,4,64,power_law_1.2,1.8536447525024413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,4,64,power_law_1.2,0.0546176016330719
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,4,64,power_law_1.2,2.3779199600219725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,4,64,power_law_1.2,0.056857597827911374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,4,64,power_law_1.2,0.06106879711151123
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,4,64,power_law_1.2,4.460089492797851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,4,64,power_law_1.2,0.06079360246658325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,4,64,power_law_1.2,0.06686720252037048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,4,64,power_law_1.2,8.063488006591797
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,4,64,power_law_1.2,0.06787840127944947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,4,64,power_law_1.2,0.06995199918746949
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,4,64,power_law_1.2,0.0697983980178833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,balanced,0.06798933446407318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,balanced,0.06906133393446605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,4,64,power_law_1.2,0.07422720193862915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,balanced,0.06990399956703186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,4,64,power_law_1.2,0.07519360184669495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,balanced,0.08865066369374593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,4,64,power_law_1.2,0.07860479950904846
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,balanced,0.11380267143249512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,balanced,0.20566399892171225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,4,64,power_law_1.2,0.08648319840431214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,balanced,0.2798186739285787
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,balanced,0.2905813256899516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,4,64,power_law_1.2,0.0889792025089264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,balanced,0.2738986611366272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,4,64,power_law_1.2,0.10440319776535034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,balanced,0.29100799560546875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,balanced,0.29121599594751996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,4,64,power_law_1.2,0.12551039457321167
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,balanced,0.27753599484761554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,balanced,0.28917332490285236
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,4,64,power_law_1.2,0.1419327974319458
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,balanced,0.2920479973157247
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,balanced,0.286954661210378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,balanced,0.2942453424135844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,4,64,power_law_1.2,0.17432960271835327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,balanced,0.27826666831970215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,4,64,power_law_1.2,0.20774400234222412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,balanced,0.2816693385442098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,4,64,power_law_1.2,0.299289608001709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,balanced,0.2948746681213379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,balanced,0.058874666690826416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,balanced,0.28576000531514484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,4,64,power_law_1.2,0.3777472019195557
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,balanced,0.0589279979467392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,balanced,0.31114667654037476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,4,64,power_law_1.2,0.6052544116973877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,balanced,0.06072533130645752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,balanced,0.07337599992752075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,4,64,power_law_1.2,0.7590784072875977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,balanced,0.3227893312772115
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,balanced,0.08784000078837077
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,4,64,power_law_1.2,1.1642815589904785
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,balanced,0.1335040032863617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,balanced,0.18381333351135254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,balanced,0.3396426836649577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,4,64,power_law_1.2,1.6064319610595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,balanced,0.19107200702031454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.01,0.20269439220428467
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,balanced,0.17895466089248657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,4,64,power_law_1.2,2.0069759368896483
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.01,0.28168959617614747
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,balanced,0.18530132373174033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,balanced,0.35919467608133954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,balanced,0.19284266233444214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,4,64,power_law_1.2,3.225254440307617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.01,0.2758527994155884
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,balanced,0.18743999799092612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.01,0.12967679500579835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,4,64,power_law_1.2,6.527526092529297
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,balanced,0.19549334049224854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.01,0.12835839986801148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,balanced,0.04555733501911163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,balanced,0.19476799170176187
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.01,0.19719680547714233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,balanced,0.6620746850967407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,balanced,0.04600533346335093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.01,0.13772159814834595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,balanced,0.19389333327611288
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,balanced,0.046240001916885376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.01,0.19383039474487304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,balanced,0.18337599436442056
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.01,0.18383359909057617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,balanced,0.04860266546408335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.01,0.23340160846710206
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,balanced,0.19430400927861533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.01,0.18315520286560058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,balanced,0.05259733398755392
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.01,0.2371135950088501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.01,0.08204159736633301
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,balanced,0.21130667130152384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,balanced,0.06330133477846782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.01,0.24117119312286378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.01,0.10432000160217285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,balanced,0.07252266506354015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,balanced,0.22241600354512533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,balanced,0.6595946550369263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.01,0.24216959476470948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,balanced,0.07415466507275899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.01,0.12575360536575317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,balanced,0.07438399891058604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,balanced,0.2428213357925415
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.01,0.25999999046325684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.01,0.14079999923706055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,balanced,0.0746666689713796
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.01,0.2461184024810791
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.01,0.1598528027534485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,balanced,0.0759626676638921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,balanced,0.257968008518219
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.01,0.1773311972618103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.01,0.241759991645813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,balanced,0.0779306689898173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.01,0.16910719871520996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,balanced,0.07903466622034709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.01,0.23618559837341307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,balanced,0.29311466217041016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.01,0.17148799896240235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,balanced,0.08044266700744629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.01,0.26732800006866453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.01,0.16030720472335816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,balanced,0.9959786732991537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,balanced,0.08778132994969685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.01,0.24056320190429686
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.01,0.17241599559783935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,balanced,0.08842133482297261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,balanced,0.33668267726898193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.01,0.16935039758682252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.01,0.2669248104095459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,balanced,0.09402133027712505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.01,0.17271679639816284
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.01,0.17520639896392823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.01,0.2899712085723877
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,balanced,0.10486933588981628
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.01,0.17968000173568727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.01,0.3236288070678711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,balanced,0.4070613384246826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.01,0.1975872039794922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.01,0.3898112058639526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.01,0.215500807762146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,balanced,0.12044266859690349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.01,0.45830402374267576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.01,0.25077118873596194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.01,0.5561024188995362
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.01,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,balanced,0.6220213174819946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,balanced,1.319200038909912
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.01,0.7185088157653808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.01,0.3638783931732178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.01,0.43030400276184083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.01,0.9585599899291992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,balanced,0.1395840048789978
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.01,0.6143167972564697
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.01,1.2995583534240722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.01,0.8110143661499023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,balanced,0.16090666254361471
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.01,1.5895296096801759
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.01,1.1417344093322754
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.01,1.9294143676757813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,balanced,0.7489439646402994
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.01,1.4357760429382325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,balanced,0.19699199994405112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.01,3.0368511199951174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.01,1.8078975677490234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.01,3.0346752166748048
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.01,6.419750213623047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,power_law_1.01,0.06675840020179749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.01,5.640063858032226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,power_law_1.01,0.0710207998752594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,balanced,0.2445919911066691
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,power_law_1.01,0.06704000234603882
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,balanced,1.0435093243916829
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,balanced,1.9787359237670898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,power_law_1.01,0.05576320290565491
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,power_law_1.01,0.05882880091667175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,balanced,0.32393066088358563
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,power_law_1.01,0.062105602025985716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,power_law_1.01,0.06255360245704651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,power_law_1.01,0.06862720251083373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,power_law_1.01,0.06912639737129211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,power_law_1.01,0.07138559818267823
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,power_law_1.01,0.07404800057411194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,balanced,1.3379200299580891
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,power_law_1.01,0.07663360238075256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,balanced,0.4366026719411214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,power_law_1.01,0.08048639893531799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,8,32,power_law_1.2,0.20764799118041993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,power_law_1.01,0.082259202003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,power_law_1.01,0.09008640050888062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,8,32,power_law_1.2,0.2873791933059692
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,power_law_1.01,0.09286400079727172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,8,32,power_law_1.2,0.2700223922729492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,power_law_1.01,0.10594559907913208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,8,32,power_law_1.2,0.10661760568618775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,balanced,0.6139520009358724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,power_law_1.01,0.12315520048141479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,8,32,power_law_1.2,0.15275520086288452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,8,32,power_law_1.2,0.1900607943534851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,power_law_1.01,0.1503167986869812
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,8,32,power_law_1.2,0.2016832113265991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,8,32,power_law_1.2,0.25890560150146485
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,8,32,power_law_1.2,0.20896639823913574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,power_law_1.01,0.16826879978179932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,balanced,2.060314655303955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,8,32,power_law_1.2,0.24442241191864014
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,power_law_1.01,0.20555520057678223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,8,32,power_law_1.2,0.24202239513397217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,power_law_1.01,0.28399999141693116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,8,32,power_law_1.2,0.24229118824005128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,balanced,0.8206559816996256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,8,32,power_law_1.2,0.24842240810394287
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,balanced,3.6481653849283853
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,power_law_1.01,0.36992640495300294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,8,32,power_law_1.2,0.2462143898010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,power_law_1.01,0.5221248149871827
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,8,32,power_law_1.2,0.2575551986694336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,8,32,power_law_1.2,0.2594239950180054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,8,32,power_law_1.2,0.25528318881988527
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,power_law_1.01,0.647327995300293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,8,32,power_law_1.2,0.2883903980255127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,power_law_1.01,0.9065728187561035
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,balanced,1.0134399731953938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,8,32,power_law_1.2,0.30969600677490233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,8,32,power_law_1.2,0.35228159427642824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,power_law_1.01,1.3037376403808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,8,32,power_law_1.2,0.41071357727050783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,power_law_1.01,1.6175039291381836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,8,32,power_law_1.2,0.5744383811950684
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,power_law_1.01,2.415059280395508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,8,32,power_law_1.2,0.13532160520553588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,8,32,power_law_1.2,0.6158527851104736
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,8,32,power_law_1.2,0.1753216028213501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,8,32,power_law_1.2,0.8430015563964843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,power_law_1.01,4.8886463165283205
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,8,32,power_law_1.2,0.14507520198822021
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,8,32,power_law_1.2,1.312390422821045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,8,32,power_law_1.2,0.10264960527420045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,8,32,power_law_1.2,0.10673279762268066
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,8,32,power_law_1.2,1.507692813873291
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,8,32,power_law_1.2,0.13344000577926635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,8,32,power_law_1.2,1.950828742980957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,8,32,power_law_1.2,0.13945599794387817
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,8,32,power_law_1.2,0.16328959465026854
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,8,32,power_law_1.2,2.452128028869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,8,32,power_law_1.2,0.15845760107040405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,balanced,1.5788960456848145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,8,32,power_law_1.2,0.15544960498809815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,8,32,power_law_1.2,4.468409729003906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,8,32,power_law_1.2,0.15585919618606567
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,balanced,3.952805201212565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,8,32,power_law_1.2,0.15500799417495728
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,8,32,power_law_1.2,9.495916748046875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,8,32,power_law_1.2,0.1607807993888855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,8,32,power_law_1.2,0.165721595287323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,8,32,power_law_1.2,0.1647104024887085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,8,32,power_law_1.2,0.18101760149002075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,8,32,power_law_1.2,0.1744447946548462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,8,32,power_law_1.2,0.19721599817276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,8,32,power_law_1.2,0.2134399890899658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,8,32,power_law_1.2,0.28097920417785643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,8,32,power_law_1.2,0.31472001075744627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,8,32,power_law_1.2,0.4073472023010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,8,32,power_law_1.2,0.49718399047851564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,8,32,power_law_1.2,0.6774464130401612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,8,32,power_law_1.2,0.8879743576049804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,8,32,power_law_1.2,1.3591744422912597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,8,32,power_law_1.2,1.7783231735229492
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,8,32,power_law_1.2,2.1002559661865234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,8,32,power_law_1.2,3.152742385864258
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,balanced,0.05482133229573568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,8,32,power_law_1.2,7.3456062316894535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,balanced,0.05542933444182078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,balanced,0.05608533322811127
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,8,32,power_law_1.2,0.06673920154571533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,balanced,0.059024001161257424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,8,32,power_law_1.2,0.07115520238876342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,balanced,0.0666133314371109
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,8,32,power_law_1.2,0.06405760049819946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,balanced,3.0872745513916016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,balanced,0.07938133180141449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,8,32,power_law_1.2,0.05296639800071716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,balanced,0.09446932872136433
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,8,32,power_law_1.2,0.05957760214805603
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,balanced,0.0958720048268636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,balanced,0.0950933297475179
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,8,32,power_law_1.2,0.06284800171852112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,balanced,0.09703466296195984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,8,32,power_law_1.2,0.06613119840621948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,balanced,0.09829333424568176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,8,32,power_law_1.2,0.06909440159797668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,balanced,0.10079466303189595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,8,32,power_law_1.2,0.06822400093078614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,balanced,0.10059733192125957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,8,32,power_law_1.2,0.07108479738235474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,balanced,0.10345600048700969
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,8,32,power_law_1.2,0.07095040082931518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,balanced,0.10897599657376607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,8,32,power_law_1.2,0.07683839797973632
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,balanced,0.1111893355846405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,8,32,power_law_1.2,0.08121600151062011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,balanced,0.1150986651579539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,8,32,power_law_1.2,0.08296959996223449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,balanced,0.12482666969299316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,8,32,power_law_1.2,0.09114879965782166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,balanced,0.13633066415786743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,8,32,power_law_1.2,0.09565439820289612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,balanced,0.15825066963831583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,8,32,power_law_1.2,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,8,32,power_law_1.2,0.1315840005874634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,balanced,0.18128534158070883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,8,32,power_law_1.2,0.14627200365066528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,balanced,0.22106132904688516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,balanced,0.04860800007979075
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,balanced,0.04837866624196371
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,8,32,power_law_1.2,0.1930176019668579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,balanced,0.049285332361857094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,balanced,0.2569013237953186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,8,32,power_law_1.2,0.23400321006774902
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,balanced,0.05276266733805338
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,8,32,power_law_1.2,0.3112191915512085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,balanced,0.06271466612815857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,balanced,0.0676746666431427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,balanced,0.3341493209203084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,balanced,0.0796319991350174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,balanced,0.0799786647160848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,8,32,power_law_1.2,0.4079296112060547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,balanced,0.08032533526420593
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,8,32,power_law_1.2,0.6060800075531005
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,balanced,0.08099733293056488
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,balanced,0.08277333279450734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,balanced,0.41732800006866455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,balanced,0.0849120020866394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,balanced,0.08654933174451192
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,8,32,power_law_1.2,0.8120960235595703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,balanced,0.08823999762535095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,8,32,power_law_1.2,1.2295552253723145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,balanced,0.09557333588600159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,balanced,0.09829866886138916
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,balanced,0.10351999600728352
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,8,32,power_law_1.2,1.725369644165039
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,balanced,0.5828320185343424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,balanced,0.11599999666213989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,8,32,power_law_1.2,2.079443168640137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,balanced,0.13083199659983316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,8,32,power_law_1.2,3.4846912384033204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,balanced,0.1553866664568583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,balanced,0.1859253247578939
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,8,32,power_law_1.2,6.377043151855469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,balanced,0.04717866579691569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,balanced,0.23280000686645508
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,balanced,0.7368053595225016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,balanced,0.04785066843032837
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,balanced,0.04965866605440775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,balanced,0.05320000151793162
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,balanced,0.28670400381088257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,balanced,0.05863999823729197
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,balanced,0.06937066713968913
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,balanced,0.08146666487058003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,balanced,0.08319999774297078
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,balanced,0.08338666955629985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,balanced,0.3890666564305623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,balanced,0.0842026670773824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,balanced,0.08603733777999878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,balanced,0.08800533413887024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,balanced,0.08966400225957234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.01,0.07093759775161743
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,balanced,0.8979413509368896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,balanced,0.09186666210492452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,balanced,0.5001173416773478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.01,0.05847039818763733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,balanced,0.09994133313496907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.01,0.08664960265159607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,balanced,0.10071466366449992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.01,0.06859520077705383
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.01,0.09337599873542786
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,balanced,0.10853333274523418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,balanced,0.12070932984352112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.01,0.07550719976425171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.01,0.0677183985710144
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.01,0.07132800221443177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.01,0.055225598812103274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.01,0.07486720085144043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,balanced,0.14036800463994345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.01,0.06044800281524658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,balanced,0.7150879700978597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.01,0.07816960215568543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.01,0.06284160017967225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.01,0.08293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.01,0.06561920046806335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.01,0.08504319787025452
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.01,0.07152640223503112
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.01,0.07107840180397033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.01,0.08481919765472412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,balanced,0.16607466340065002
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.01,0.08743039965629577
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.01,0.07519360184669495
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,balanced,0.19645333290100098
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.01,0.08748160004615783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.01,0.07430400252342224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,balanced,0.9146293004353842
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,balanced,1.3869387308756511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.01,0.09143679738044738
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.01,0.07916799783706666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,balanced,0.24774932861328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.01,0.09639679789543151
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.01,0.08283519744873047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,power_law_1.01,0.060684800148010254
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.01,0.10534399747848511
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.01,0.08522239923477173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,power_law_1.01,0.07095040082931518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.01,0.11191680431365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.01,0.09403520226478576
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,power_law_1.01,0.08017280101776122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.01,0.11955840587615967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.01,0.09859840273857116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,power_law_1.01,0.055251199007034305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.01,0.10943360328674316
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,balanced,0.32603200276692706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.01,0.1367743968963623
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,power_law_1.01,0.06162559986114502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.01,0.12859519720077514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,power_law_1.01,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.01,0.14321279525756836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,16,16,power_law_1.2,0.07496320009231568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,power_law_1.01,0.07011200189590454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,balanced,1.1245013078053792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.01,0.13938560485839843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.01,0.17889280319213868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,16,16,power_law_1.2,0.0866047978401184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,power_law_1.01,0.07747840285301208
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.01,0.1738816022872925
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,balanced,0.44072532653808594
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.01,0.20865280628204347
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,power_law_1.01,0.07708160281181335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,16,16,power_law_1.2,0.07876480221748353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.01,0.20078721046447753
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,power_law_1.01,0.07835519909858704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.01,0.26800639629364015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,16,16,power_law_1.2,0.06626560091972351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.01,0.27192320823669436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,power_law_1.01,0.08238080143928528
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,16,16,power_law_1.2,0.0679040014743805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.01,0.302892804145813
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.01,0.32125439643859866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,power_law_1.01,0.08605440258979798
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,16,16,power_law_1.2,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,balanced,0.598693331082662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.01,0.41230077743530275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.01,0.44808320999145507
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,power_law_1.01,0.08942080140113831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,16,16,power_law_1.2,0.07468159794807434
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.01,0.5782527923583984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.01,0.5198272228240967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,power_law_1.01,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,16,16,power_law_1.2,0.082259202003479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.01,0.8462783813476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.01,0.7102272033691406
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,power_law_1.01,0.1052672028541565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,16,16,power_law_1.2,0.08311039805412293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.01,1.0465215682983398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,power_law_1.01,0.11221760511398315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.01,0.9875200271606446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,16,16,power_law_1.2,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,power_law_1.01,0.12124160528182984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,16,16,power_law_1.2,0.08663039803504943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.01,1.1578495979309082
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.01,1.4148608207702638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,balanced,0.8321812947591146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,power_law_1.01,0.14616960287094116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,16,16,power_law_1.2,0.08984320163726807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.01,1.9507776260375977
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.01,2.0914943695068358
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,16,16,power_law_1.2,0.08929920196533203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,balanced,1.7733173370361328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,power_law_1.01,0.1655295968055725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,16,16,power_law_1.2,0.09579520225524903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.01,3.817804718017578
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.01,4.205900955200195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,16,16,power_law_1.2,0.10551680326461792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,16,16,power_law_1.2,0.11418240070343018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,power_law_1.01,0.20475521087646484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,16,16,power_law_1.2,0.12268160581588745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,balanced,2.6684745152791343
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,power_law_1.01,0.24003839492797852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,16,16,power_law_1.2,0.13935999870300292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,power_law_1.01,0.35992960929870604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,16,16,power_law_1.2,0.1500607967376709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,16,16,power_law_1.2,0.1827455997467041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,balanced,1.1113759676615398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,16,16,power_law_1.2,0.23383040428161622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,power_law_1.01,0.4332096099853516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,16,16,power_law_1.2,0.2810431957244873
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,power_law_1.01,0.6372735977172852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,16,16,power_law_1.2,0.32383999824523924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,power_law_1.01,0.797433614730835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,16,16,power_law_1.2,0.49251837730407716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,power_law_1.01,1.2061311721801757
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,16,16,power_law_1.2,0.5776895999908447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,power_law_1.01,1.7797632217407227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,16,16,power_law_1.2,0.8564672470092773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,power_law_1.01,1.9940607070922851
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,16,16,power_law_1.2,1.0729727745056152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,balanced,1.3696266810099285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,16,16,power_law_1.2,1.2781567573547363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,power_law_1.01,3.114476776123047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,16,16,power_law_1.2,2.0738176345825194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,power_law_1.01,6.067193603515625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,16,16,power_law_1.2,4.670912170410157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,balanced,3.471712112426758
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,16,16,power_law_1.2,0.06096640229225159
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,balanced,2.138597329457601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,16,16,power_law_1.2,0.06880639791488648
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,16,16,power_law_1.2,0.05964159965515137
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,16,16,power_law_1.2,0.0567359983921051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,16,16,power_law_1.2,0.06559360027313232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,16,16,power_law_1.2,0.061561602354049685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,16,16,power_law_1.2,0.066975998878479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,16,16,power_law_1.2,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,16,16,power_law_1.2,0.07057279944419861
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,16,16,power_law_1.2,0.07253760099411011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,16,16,power_law_1.2,0.07408639788627625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,16,16,power_law_1.2,0.08013439774513245
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,16,16,power_law_1.2,0.08133119940757752
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,16,16,power_law_1.2,0.08350080251693726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,16,16,power_law_1.2,0.09772160053253173
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,16,16,power_law_1.2,0.10005760192871094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,16,16,power_law_1.2,0.1102463960647583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,16,16,power_law_1.2,0.13162879943847655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,16,16,power_law_1.2,0.14304640293121337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,16,16,power_law_1.2,0.18581119775772095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,16,16,power_law_1.2,0.20874879360198975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,balanced,4.193968137105306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,16,16,power_law_1.2,0.2776384115219116
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,16,16,power_law_1.2,0.35350399017333983
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,16,16,power_law_1.2,0.4933055877685547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,16,16,power_law_1.2,0.6183167934417725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,16,16,power_law_1.2,0.9647551536560058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,16,16,power_law_1.2,1.2170880317687989
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,16,16,power_law_1.2,1.53504638671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,16,16,power_law_1.2,2.3803583145141602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,16,16,power_law_1.2,5.114924621582031
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,balanced,0.05605866511662801
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,balanced,0.054885332783063255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,balanced,0.05693333347638448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1,7168,2048,8,384,16,16,power_law_1.2,0.061273598670959474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,balanced,0.048783997694651283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,balanced,0.060746664802233376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2,7168,2048,8,384,16,16,power_law_1.2,0.07008640170097351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,balanced,0.06897599995136261
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,balanced,0.04929600159327189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4,7168,2048,8,384,16,16,power_law_1.2,0.06038399934768677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,balanced,0.0960586667060852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,balanced,0.05086933573087057
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8,7168,2048,8,384,16,16,power_law_1.2,0.05808640122413635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,balanced,0.1129866639773051
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,balanced,0.05561066667238871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16,7168,2048,8,384,16,16,power_law_1.2,0.06195840239524841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,balanced,0.06169599791367849
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,balanced,0.10914132992426555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,balanced,0.08054933448632558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32,7168,2048,8,384,16,16,power_law_1.2,0.06522240042686463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,balanced,0.10877333084742229
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,balanced,0.09462933739026387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,balanced,0.1114026705423991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,48,7168,2048,8,384,16,16,power_law_1.2,0.06849920153617858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,balanced,0.09539733330408733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,balanced,0.09548800190289815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,balanced,0.11108799775441487
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,64,7168,2048,8,384,16,16,power_law_1.2,0.07674880027770996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,balanced,0.09723200400670369
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,80,7168,2048,8,384,16,16,power_law_1.2,0.07804800271987915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,balanced,0.11522666613260905
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,balanced,0.09943466385205586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,96,7168,2048,8,384,16,16,power_law_1.2,0.07776640057563781
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,balanced,0.11582932869593303
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,balanced,0.10083733002344768
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,balanced,0.1034986674785614
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,balanced,0.11442133784294128
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,128,7168,2048,8,384,16,16,power_law_1.2,0.081004798412323
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,balanced,0.10425066947937012
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,balanced,0.1234933336575826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,160,7168,2048,8,384,16,16,power_law_1.2,0.08617600202560424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,balanced,0.11331199606259663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,balanced,0.12281066179275513
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,192,7168,2048,8,384,16,16,power_law_1.2,0.08872320055961609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,balanced,0.11467732985814412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,balanced,0.12854400277137756
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,256,7168,2048,8,384,16,16,power_law_1.2,0.09528959989547729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,balanced,0.12173866232236226
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.01,0.06307200193405152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,320,7168,2048,8,384,16,16,power_law_1.2,0.10420479774475097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,balanced,0.14468266566594443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,balanced,0.13689066966374716
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,384,7168,2048,8,384,16,16,power_law_1.2,0.10897279977798462
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.01,0.06316159963607788
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,balanced,0.1590986649195353
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,balanced,0.1532586713631948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,512,7168,2048,8,384,16,16,power_law_1.2,0.12432639598846436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.01,0.08880640268325805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,768,7168,2048,8,384,16,16,power_law_1.2,0.16299519538879395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.01,0.062438398599624634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,balanced,0.1869279940923055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,balanced,0.18378132581710815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.01,0.06938239932060242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.01,0.05480319857597351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1024,7168,2048,8,384,16,16,power_law_1.2,0.18068480491638184
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,balanced,0.21870400508244833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,balanced,0.21451733509699503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.01,0.0863103985786438
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.01,0.05686399936676025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.01,0.08897280097007751
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.01,0.07498239874839782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,balanced,0.2760106722513835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.01,0.09493759870529175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.01,0.0574400007724762
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,balanced,0.2622346679369609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,1536,7168,2048,8,384,16,16,power_law_1.2,0.2236799955368042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.01,0.062489598989486694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.01,0.09702399969100953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,2048,7168,2048,8,384,16,16,power_law_1.2,0.28053760528564453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.01,0.10033279657363892
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.01,0.07237759828567505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,balanced,0.34591468175252277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,3072,7168,2048,8,384,16,16,power_law_1.2,0.4134208202362061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,balanced,0.32124267021814984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.01,0.10216319561004639
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.01,0.0769599974155426
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.01,0.11017600297927857
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.01,0.08335999846458435
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.01,0.11110399961471558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.01,0.08477439880371093
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,4096,7168,2048,8,384,16,16,power_law_1.2,0.48736000061035156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.01,0.10659199953079224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,balanced,0.4827680190404256
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.01,0.08684160113334656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,balanced,0.43917866547902423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.01,0.12175999879837036
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,6144,7168,2048,8,384,16,16,power_law_1.2,0.7565311908721923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.01,0.08707839846611024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.01,0.13148159980773927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,8192,7168,2048,8,384,16,16,power_law_1.2,0.9119487762451172
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.01,0.09178879857063293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.01,0.13419519662857055
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,12288,7168,2048,8,384,16,16,power_law_1.2,1.6261568069458008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.01,0.09285759925842285
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.01,0.15312000513076782
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,balanced,0.6231199900309244
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.01,0.10068479776382447
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.01,0.19615999460220337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,balanced,0.5532586574554443
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.01,0.11483520269393921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,16384,7168,2048,8,384,16,16,power_law_1.2,1.8323392868041992
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.01,0.24106240272521973
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.01,0.11886080503463745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.01,0.25112318992614746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,20480,7168,2048,8,384,16,16,power_law_1.2,2.4409536361694335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.01,0.12833280563354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.01,0.3236160039901733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.01,0.1523967981338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.01,0.3883136034011841
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,32768,7168,2048,8,384,16,16,power_law_1.2,4.053023910522461
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.01,0.1631872057914734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.01,0.5219264030456543
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,balanced,0.9009386698404948
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.01,0.20805759429931642
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.01,0.6739391803741455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,balanced,0.7895786762237549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.01,0.23240320682525634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8_block,65536,7168,2048,8,384,16,16,power_law_1.2,8.416473388671875
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.01,0.9595775604248047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.01,0.3171072006225586
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.01,1.2233920097351074
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.01,0.3845760107040405
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.01,1.4312383651733398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.01,0.5536960124969482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.01,2.232044792175293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.01,0.6948607921600342
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.01,4.448588943481445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.01,0.9906815528869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,balanced,1.137221336364746
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,balanced,0.9814453125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.01,1.2706624031066895
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.01,1.6121728897094727
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.01,2.483955192565918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.01,5.124972915649414
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,balanced,1.4093012809753418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,balanced,1.2097386519114177
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1,7168,2048,8,384,32,8,power_law_1.2,0.06353279948234558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2,7168,2048,8,384,32,8,power_law_1.2,0.06359040141105651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4,7168,2048,8,384,32,8,power_law_1.2,0.07383040189743043
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8,7168,2048,8,384,32,8,power_law_1.2,0.06304640173912049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16,7168,2048,8,384,32,8,power_law_1.2,0.06844159960746765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32,7168,2048,8,384,32,8,power_law_1.2,0.08318079710006714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,48,7168,2048,8,384,32,8,power_law_1.2,0.0861952006816864
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,64,7168,2048,8,384,32,8,power_law_1.2,0.09435520172119141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,80,7168,2048,8,384,32,8,power_law_1.2,0.0971455991268158
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,96,7168,2048,8,384,32,8,power_law_1.2,0.09746559858322143
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,128,7168,2048,8,384,32,8,power_law_1.2,0.10291839838027954
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,160,7168,2048,8,384,32,8,power_law_1.2,0.10891519784927368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,balanced,2.220991929372152
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,192,7168,2048,8,384,32,8,power_law_1.2,0.11367039680480957
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,256,7168,2048,8,384,32,8,power_law_1.2,0.1149440050125122
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,balanced,1.8985973993937175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,320,7168,2048,8,384,32,8,power_law_1.2,0.12175359725952148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,384,7168,2048,8,384,32,8,power_law_1.2,0.13150080442428588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,512,7168,2048,8,384,32,8,power_law_1.2,0.134662401676178
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,768,7168,2048,8,384,32,8,power_law_1.2,0.16254080533981324
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1024,7168,2048,8,384,32,8,power_law_1.2,0.19398399591445922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,1536,7168,2048,8,384,32,8,power_law_1.2,0.2545792102813721
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,2048,7168,2048,8,384,32,8,power_law_1.2,0.2688127994537354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,3072,7168,2048,8,384,32,8,power_law_1.2,0.34603519439697267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,4096,7168,2048,8,384,32,8,power_law_1.2,0.4143680095672607
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,6144,7168,2048,8,384,32,8,power_law_1.2,0.574451208114624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,8192,7168,2048,8,384,32,8,power_law_1.2,0.7779327869415283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,12288,7168,2048,8,384,32,8,power_law_1.2,1.0084223747253418
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,16384,7168,2048,8,384,32,8,power_law_1.2,1.2365504264831544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,20480,7168,2048,8,384,32,8,power_law_1.2,1.6339839935302733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,32768,7168,2048,8,384,32,8,power_law_1.2,2.4395072937011717
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,power_law_1.2,4.756991958618164
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,balanced,4.356911977132161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,float16,65536,7168,2048,8,384,32,8,balanced,3.6044801076253257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,balanced,0.043061330914497375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,balanced,0.04391466577847799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1,7168,2048,8,384,32,8,power_law_1.2,0.055257600545883176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,balanced,0.044112001856168113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,balanced,0.04885333279768626
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2,7168,2048,8,384,32,8,power_law_1.2,0.056467199325561525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,balanced,0.055642664432525635
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,balanced,0.06640533109505971
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4,7168,2048,8,384,32,8,power_law_1.2,0.05858560204505921
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,balanced,0.060496002435684204
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8,7168,2048,8,384,32,8,power_law_1.2,0.057785600423812866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,power_law_1.01,0.04196479916572571
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,balanced,0.060592000683148704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,power_law_1.01,0.04323840141296387
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,balanced,0.06844266752401988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16,7168,2048,8,384,32,8,power_law_1.2,0.06105599999427795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,power_law_1.01,0.04368639886379242
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,balanced,0.0699946681658427
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32,7168,2048,8,384,32,8,power_law_1.2,0.06762880086898804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,balanced,0.07122133175532024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,power_law_1.01,0.04657920002937317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,balanced,0.06692799925804138
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,power_law_1.01,0.04981119930744171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,48,7168,2048,8,384,32,8,power_law_1.2,0.07192959785461425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,balanced,0.06831466654936473
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,power_law_1.01,0.05740799903869629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,balanced,0.0690880020459493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,64,7168,2048,8,384,32,8,power_law_1.2,0.0793727993965149
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,power_law_1.01,0.05870720148086548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,balanced,0.06930666665236156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,80,7168,2048,8,384,32,8,power_law_1.2,0.08463360071182251
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,power_law_1.01,0.058336001634597776
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,balanced,0.07018133501211803
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,power_law_1.01,0.06729599833488464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,96,7168,2048,8,384,32,8,power_law_1.2,0.08446720242500305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,balanced,0.07066133121649425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,power_law_1.01,0.06711680293083191
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,128,7168,2048,8,384,32,8,power_law_1.2,0.08705919981002808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,balanced,0.07553599774837494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,power_law_1.01,0.06702079772949218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,160,7168,2048,8,384,32,8,power_law_1.2,0.09077759981155395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,balanced,0.07761066655317943
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,192,7168,2048,8,384,32,8,power_law_1.2,0.09168000221252441
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,power_law_1.01,0.06743040084838867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,balanced,0.0853706697622935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,256,7168,2048,8,384,32,8,power_law_1.2,0.1071679949760437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,power_law_1.01,0.06772480010986329
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,320,7168,2048,8,384,32,8,power_law_1.2,0.11764479875564575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,balanced,0.09664000074068706
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,power_law_1.01,0.06855679750442505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,384,7168,2048,8,384,32,8,power_law_1.2,0.1255295991897583
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,power_law_1.01,0.06926720142364502
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,balanced,0.1122773289680481
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,512,7168,2048,8,384,32,8,power_law_1.2,0.13024640083312988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,power_law_1.01,0.06963840126991272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,768,7168,2048,8,384,32,8,power_law_1.2,0.1555456042289734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,power_law_1.01,0.07184640169143677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,balanced,0.12797333796819052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,2,128,power_law_1.2,0.04222080111503601
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,power_law_1.01,0.07760000228881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1024,7168,2048,8,384,32,8,power_law_1.2,0.1682752013206482
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,power_law_1.01,0.07916160225868225
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,2,128,power_law_1.2,0.04349440038204193
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,1536,7168,2048,8,384,32,8,power_law_1.2,0.22447359561920166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,balanced,0.16146133343378702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,power_law_1.01,0.08880000114440918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,2,128,power_law_1.2,0.04258559942245484
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,2048,7168,2048,8,384,32,8,power_law_1.2,0.2524991989135742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,power_law_1.01,0.09866880178451538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,2,128,power_law_1.2,0.046758401393890384
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,power_law_1.01,0.15656319856643677
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,3072,7168,2048,8,384,32,8,power_law_1.2,0.32635519504547117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,balanced,0.20085332791010538
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,2,128,power_law_1.2,0.04954879879951477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,power_law_1.01,0.17466239929199218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,4096,7168,2048,8,384,32,8,power_law_1.2,0.4218431949615479
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,2,128,power_law_1.2,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,power_law_1.01,0.2471679925918579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,power_law_1.01,0.33029119968414306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,6144,7168,2048,8,384,32,8,power_law_1.2,0.5909440040588378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,2,128,power_law_1.2,0.05794559717178345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,balanced,0.2863466739654541
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,2,128,power_law_1.2,0.057843202352523805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,8192,7168,2048,8,384,32,8,power_law_1.2,0.7499008178710938
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,power_law_1.01,0.47095041275024413
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,2,128,power_law_1.2,0.06714879870414733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,12288,7168,2048,8,384,32,8,power_law_1.2,1.1570112228393554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,power_law_1.01,0.6905792236328125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,2,128,power_law_1.2,0.06716160178184509
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,power_law_1.01,0.8167743682861328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,16384,7168,2048,8,384,32,8,power_law_1.2,1.471840000152588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,2,128,power_law_1.2,0.0676800012588501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,balanced,0.37265066305796307
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,power_law_1.01,1.2949824333190918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,2,128,power_law_1.2,0.06738560199737549
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,20480,7168,2048,8,384,32,8,power_law_1.2,1.8392192840576171
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,2,128,power_law_1.2,0.06803839802742004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,power_law_1.01,2.6469951629638673
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,2,128,power_law_1.2,0.06913920044898987
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,32768,7168,2048,8,384,32,8,power_law_1.2,2.9443071365356444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,2,128,power_law_1.2,0.06944640278816223
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,2,128,power_law_1.2,0.06970880031585694
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,balanced,0.03316800047953924
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,balanced,0.4609866539637248
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,fp8,65536,7168,2048,8,384,32,8,power_law_1.2,6.216147232055664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,2,128,power_law_1.2,0.0719488024711609
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,balanced,0.03402133285999298
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,2,128,power_law_1.2,0.07625600099563598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,2,128,power_law_1.2,0.0788927972316742
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,balanced,0.03719999889532725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,2,128,power_law_1.2,0.09898880124092102
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,balanced,0.0405173326532046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,2,128,power_law_1.2,0.14179840087890624
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,balanced,0.045663997530937195
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,2,128,power_law_1.2,0.17797759771347046
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,balanced,0.05388799806435903
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,2,128,power_law_1.2,0.23494400978088378
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,balanced,0.7211519877115885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,balanced,0.05385600030422211
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,power_law_1.2,0.03304319977760315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,4,64,power_law_1.01,0.03309440016746521
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,2,128,power_law_1.2,0.35048320293426516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,balanced,0.054645334680875145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,power_law_1.2,0.033657601475715636
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,4,64,power_law_1.01,0.03373439908027649
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,balanced,0.056373332937558494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,2,128,power_law_1.2,0.4361855983734131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,power_law_1.2,0.03304319977760315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,4,64,power_law_1.01,0.033369600772857666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,balanced,0.05665599803129832
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,2,128,power_law_1.2,0.698956823348999
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,balanced,0.05382933219273885
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,power_law_1.2,0.03697279989719391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,4,64,power_law_1.01,0.037376001477241516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,balanced,0.06063466767470042
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,2,128,power_law_1.2,0.9713472366333008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,4,64,power_law_1.01,0.040870401263237
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,balanced,0.06030400097370148
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,power_law_1.2,0.04323199987411499
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,4,64,power_law_1.01,0.04360319972038269
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,2,128,power_law_1.2,1.3122431755065918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,balanced,0.060693333546320595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,power_law_1.2,0.05082240104675293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,4,64,power_law_1.01,0.05309439897537231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,2,128,power_law_1.2,1.8262271881103516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,balanced,0.06095466514428457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,4,64,power_law_1.01,0.05148800015449524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,power_law_1.2,0.05060480237007141
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,power_law_1.2,4.869286346435547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,balanced,0.06205333272616068
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,4,64,power_law_1.01,0.050342398881912234
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,power_law_1.2,0.05070080161094666
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,4,64,power_law_1.01,0.050310397148132326
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,balanced,0.06595199803511302
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,power_law_1.2,0.0525056004524231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,4,64,power_law_1.01,0.05234559774398804
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,power_law_1.2,0.05284479856491089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,balanced,0.0687253326177597
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,4,64,power_law_1.01,0.05301759839057922
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,power_law_1.2,0.058911997079849246
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,balanced,0.07760000228881836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,2,128,balanced,1.4140480359395344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,power_law_1.2,0.0596671998500824
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,4,64,power_law_1.01,0.05889279842376709
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,power_law_1.2,0.060102397203445436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,balanced,0.08788266777992249
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,4,64,power_law_1.01,0.05930240154266357
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,power_law_1.2,0.06043519973754883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,balanced,0.10412266850471497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,4,64,power_law_1.01,0.059411197900772095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,power_law_1.2,0.06263039708137512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,power_law_1.2,0.06807680130004883
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,4,64,power_law_1.01,0.060070401430130003
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,balanced,0.1225493351618449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,power_law_1.2,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,4,64,power_law_1.01,0.06217600107192993
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,power_law_1.2,0.08889600038528442
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,4,64,power_law_1.01,0.06687999963760376
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,balanced,0.16192000110944113
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,power_law_1.2,0.10012799501419067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,power_law_1.2,0.14393600225448608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,4,64,power_law_1.01,0.07036799788475037
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,power_law_1.2,0.18183679580688478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,balanced,0.19653334220250449
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,4,64,power_law_1.01,0.08380799889564514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,power_law_1.2,0.24858241081237792
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,4,64,power_law_1.01,0.09621120095252991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,power_law_1.2,0.3605760097503662
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,4,64,power_law_1.01,0.11747200489044189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,power_law_1.2,0.49567360877990724
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,4,64,power_law_1.01,0.14863359928131104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,balanced,0.2767573396364848
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,power_law_1.2,0.6746367931365966
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,power_law_1.2,0.8150783538818359
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,4,64,power_law_1.01,0.2127295970916748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,4,64,power_law_1.01,0.26023681163787843
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,power_law_1.2,1.4553983688354493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,4,64,power_law_1.01,0.41904640197753906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,power_law_1.2,3.202163314819336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,balanced,0.3588320016860962
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,4,64,power_law_1.01,0.5228288173675537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,power_law_1.01,0.6396416187286377
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,power_law_1.01,1.0761856079101562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,power_law_1.01,2.057209587097168
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,4,64,balanced,0.4432320197423299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,balanced,0.030437332888444264
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,balanced,0.03166399896144867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,balanced,0.03190933416287104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,4,64,balanced,0.6905386447906494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,balanced,0.03370666752258936
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,balanced,0.03741333385308584
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,balanced,0.03994133323431015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,balanced,0.04277333120505015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,balanced,0.04513599971930186
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,balanced,0.04877333343029022
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,balanced,0.048751999934514366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,balanced,0.050250664353370667
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,balanced,0.048010667165120445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,balanced,0.049125333627065025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,balanced,0.049600000182787575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,balanced,0.0517493337392807
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,balanced,0.05804799993832906
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,4,64,balanced,1.3586667378743489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,balanced,0.05907199780146281
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,8,32,power_law_1.01,0.031027200818061828
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,balanced,0.0621066689491272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,power_law_1.2,0.0321152001619339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,8,32,power_law_1.01,0.03209599852561951
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,balanced,0.06459199885527293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,power_law_1.01,0.030675199627876282
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,8,32,power_law_1.2,0.030649599432945252
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,power_law_1.01,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,balanced,0.07601066430409749
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,8,32,power_law_1.2,0.034195199608802795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,power_law_1.01,0.035673600435256955
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,power_law_1.01,0.03815680146217346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,balanced,0.08675733208656311
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,8,32,power_law_1.2,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,power_law_1.01,0.042361599206924436
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,power_law_1.01,0.04312959909439087
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,8,32,power_law_1.2,0.0377920001745224
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,balanced,0.1050879955291748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,power_law_1.01,0.04835200011730194
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,8,32,power_law_1.2,0.042233601212501526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,power_law_1.01,0.048665601015090945
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,power_law_1.01,0.049721598625183105
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,balanced,0.12330666184425354
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,8,32,power_law_1.2,0.04307839870452881
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,8,32,power_law_1.2,0.047142401337623596
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,power_law_1.01,0.04878720045089722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,balanced,0.1651893357435862
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,8,32,power_law_1.2,0.04755840003490448
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,power_law_1.01,0.052275198698043826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,power_law_1.01,0.05309439897537231
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,8,32,power_law_1.2,0.048416000604629514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,balanced,0.027744000156720478
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,power_law_1.01,0.058745598793029784
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,8,32,power_law_1.2,0.050470399856567386
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,balanced,0.02938666691382726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,balanced,0.19981332619984946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,power_law_1.01,0.06053119897842407
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,8,32,power_law_1.2,0.04912639856338501
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,balanced,0.029658667743206024
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,power_law_1.01,0.06458240151405334
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,balanced,0.032245332996050514
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,8,32,power_law_1.2,0.051577597856521606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,power_law_1.01,0.07008000016212464
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,balanced,0.03451200077931086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,8,32,power_law_1.2,0.05303040146827698
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,power_law_1.01,0.08231679797172546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,balanced,0.27340267101923627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,balanced,0.03453333427508672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,8,32,power_law_1.2,0.06007680296897888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,power_law_1.01,0.09465600252151489
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,balanced,0.038021333515644073
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,8,32,power_law_1.2,0.06004480123519897
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,power_law_1.01,0.1185215950012207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,8,32,power_law_1.2,0.06709120273590088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,power_law_1.01,0.14247039556503296
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,8,32,power_law_1.2,0.07392640113830566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,balanced,0.35237332185109455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,balanced,0.042463997999827065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,power_law_1.01,0.19635839462280275
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,power_law_1.01,0.02855679988861084
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,balanced,0.040234667559464775
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,8,32,power_law_1.2,0.0849727988243103
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,power_law_1.01,0.25408000946044923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,balanced,0.05373866856098175
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,power_law_1.01,0.03270399868488312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,8,32,power_law_1.2,0.09998720288276672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,power_law_1.01,0.3714047908782959
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,balanced,0.05500266452630361
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,power_law_1.01,0.02993279993534088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,8,32,power_law_1.2,0.12386560440063477
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,power_law_1.01,0.4831808090209961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,balanced,0.0497920016447703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,power_law_1.01,0.0328575998544693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,8,32,power_law_1.2,0.1638975977897644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,balanced,0.43319467703501385
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,balanced,0.051728000243504844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,power_law_1.01,0.5756351947784424
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,power_law_1.01,0.03447040021419525
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,8,32,power_law_1.2,0.21729280948638915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,balanced,0.05474133292833964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,power_law_1.01,0.9198143959045411
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,power_law_1.01,0.03363839983940124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,8,32,power_law_1.2,0.3000063896179199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,balanced,0.056799997886021934
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,power_law_1.01,1.8887872695922852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,balanced,0.06613333523273468
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,8,32,power_law_1.2,0.4290304183959961
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,power_law_1.01,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,balanced,0.06890666484832764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,8,32,power_law_1.2,0.5879104137420654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,power_law_1.01,0.04105600118637085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,balanced,0.08123200138409932
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,8,32,power_law_1.2,0.6985983848571777
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,power_law_1.01,0.041177600622177124
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,balanced,0.09052800138791402
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,power_law_1.2,1.0732671737670898
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,8,32,balanced,0.68012801806132
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,16,16,power_law_1.2,0.028863999247550964
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,power_law_1.01,0.039289599657058714
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,balanced,0.10897066195805867
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,power_law_1.2,2.361248016357422
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,16,16,power_law_1.2,0.032543998956680295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,power_law_1.01,0.0536191999912262
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,balanced,0.1274133324623108
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,16,16,power_law_1.2,0.02937600016593933
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,power_law_1.01,0.05491200089454651
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,16,16,power_law_1.2,0.0326335996389389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,balanced,0.17166399955749512
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,power_law_1.01,0.0522816002368927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,16,16,power_law_1.2,0.03380480110645294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,16,16,power_law_1.2,0.03315199911594391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,power_law_1.01,0.05295360088348389
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,balanced,0.20667733748753866
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,power_law_1.01,0.057734400033950806
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,16,16,power_law_1.2,0.03754239976406097
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,balanced,0.02735999971628189
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,power_law_1.01,0.05921919941902161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,16,16,power_law_1.2,0.0363072007894516
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,balanced,0.028783999383449554
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,power_law_1.01,0.07034879922866821
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,balanced,0.2830666700998942
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,16,16,power_law_1.2,0.04051840007305145
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,power_law_1.01,0.07336959838867188
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,balanced,0.02869333326816559
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,balanced,0.03190933416287104
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,16,16,power_law_1.2,0.0418368011713028
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,power_law_1.01,0.08725119829177856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,power_law_1.01,0.09687680006027222
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,8,32,balanced,1.3289653460184734
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,balanced,0.03339199970165888
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,16,16,power_law_1.2,0.04023039937019348
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,power_law_1.01,0.12130559682846069
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,balanced,0.03544000039498011
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,balanced,0.3686506748199463
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,16,16,power_law_1.2,0.05353599786758423
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,power_law_1.01,0.1457152009010315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,balanced,0.03638399889071783
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,power_law_1.01,0.2131648063659668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,16,16,power_law_1.2,0.05414400100708008
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,balanced,0.03498133271932602
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,power_law_1.01,0.25319681167602537
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,16,16,power_law_1.2,0.05192959904670715
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,power_law_1.01,0.36608641147613524
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,balanced,0.03938133269548416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,16,16,power_law_1.2,0.0531711995601654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,power_law_1.01,0.46625280380249023
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,balanced,0.03807999938726425
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,balanced,0.4606826702753703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,power_law_1.01,0.5724095821380615
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,16,16,power_law_1.2,0.05914239883422852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,balanced,0.03716266651948293
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,power_law_1.01,0.9092991828918457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,16,16,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,balanced,0.043680002291997276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,power_law_1.01,1.8879295349121095
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,16,16,power_law_1.2,0.07180799841880799
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,balanced,0.044794668753941856
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,balanced,0.042170668641726174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,16,16,power_law_1.2,0.07688959836959838
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,balanced,0.057301332553227745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,16,16,power_law_1.2,0.08936960101127625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,balanced,0.05773333211739858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,16,16,power_law_1.2,0.1004480004310608
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,balanced,0.7077120145161947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,balanced,0.05550933380921682
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,16,16,power_law_1.2,0.12257280349731445
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,16,16,power_law_1.2,0.15730559825897217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,balanced,0.06586666901906331
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,power_law_1.01,0.02791680097579956
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,16,16,power_law_1.2,0.21471359729766845
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,balanced,0.07107200225194295
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,power_law_1.01,0.02948479950428009
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,16,16,power_law_1.2,0.2917056083679199
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,balanced,0.0867680013179779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,power_law_1.01,0.030329599976539612
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,16,16,power_law_1.2,0.40514559745788575
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,balanced,0.09593600034713745
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,power_law_1.01,0.031513598561286923
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,16,16,power_law_1.2,0.5188992023468018
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,power_law_1.01,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,balanced,0.11485866705576579
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,power_law_1.01,0.03395200073719025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,16,16,power_law_1.2,0.7233215808868408
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,balanced,0.13375999530156454
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,power_law_1.01,0.03521279990673065
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,16,16,power_law_1.2,1.0182016372680665
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,power_law_1.01,0.03433600068092346
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,power_law_1.2,2.025267219543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,balanced,0.18254933754603067
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,16,16,balanced,1.387056032816569
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,power_law_1.01,0.03765760064125061
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,power_law_1.01,0.036108800768852235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,balanced,0.21874133745829263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,power_law_1.01,0.043584001064300534
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,power_law_1.01,0.043635201454162595
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,power_law_1.01,0.041766399145126344
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,balanced,0.30112000306447345
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,power_law_1.01,0.05726079940795899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,power_law_1.01,0.05937280058860779
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,power_law_1.01,0.057868802547454835
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,balanced,0.39101866881052655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,power_law_1.01,0.0686784029006958
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,power_law_1.01,0.07272959947586059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,power_law_1.01,0.09157119989395142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,power_law_1.01,0.10160640478134156
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,power_law_1.01,0.1238592028617859
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,balanced,0.49385066827138263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,power_law_1.01,0.1502527952194214
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,power_law_1.01,0.19935359954833984
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,power_law_1.01,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,power_law_1.01,0.37620480060577394
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,power_law_1.01,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,128,32,8,power_law_1.2,0.027795198559761047
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,power_law_1.01,0.5993152141571045
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,128,32,8,power_law_1.2,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,balanced,0.7476533253987631
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,power_law_1.01,0.9245311737060546
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,128,32,8,power_law_1.2,0.028512001037597656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,128,32,8,power_law_1.2,0.03166080117225647
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,power_law_1.01,1.780499267578125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,128,32,8,power_law_1.2,0.032671999931335446
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,balanced,0.02903999884923299
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,128,32,8,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,balanced,0.030202666918436687
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,balanced,0.03035199890534083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,128,32,8,power_law_1.2,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,balanced,0.03345600018898646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,128,32,8,power_law_1.2,0.034297600388526917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,balanced,0.036346666514873505
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,128,32,8,power_law_1.2,0.03731839954853058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,balanced,0.04106133431196213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,128,32,8,power_law_1.2,0.037510401010513304
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,balanced,0.04197333256403605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,128,32,8,power_law_1.2,0.03633280098438263
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,balanced,0.04195199906826019
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,128,32,8,power_law_1.2,0.043347200751304625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,balanced,0.04200533529122671
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,128,32,8,power_law_1.2,0.043628799915313723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,balanced,1.462997277577718
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,balanced,0.04211199780305227
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,128,32,8,power_law_1.2,0.042982399463653564
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,balanced,0.04256533086299896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,128,32,8,power_law_1.2,0.055904000997543335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,128,32,8,power_law_1.2,0.06048640012741089
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,128,32,8,power_law_1.2,0.058924800157546996
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,balanced,0.04261333247025808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,128,32,8,power_law_1.2,0.07182719707489013
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,power_law_1.01,0.02871040105819702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,balanced,0.04486933350563049
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,128,32,8,power_law_1.2,0.07883520126342773
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,power_law_1.01,0.029721599817276
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,balanced,0.04771733283996582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,128,32,8,power_law_1.2,0.09218559861183166
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,power_law_1.01,0.029580798745155335
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,balanced,0.048901334404945374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,power_law_1.01,0.032678401470184325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,128,32,8,power_law_1.2,0.10329600572586059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,power_law_1.01,0.03482879996299744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,balanced,0.05502399802207947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,128,32,8,power_law_1.2,0.12933759689331054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,8,32,power_law_1.2,0.028409600257873535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,balanced,0.05659733215967814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,128,32,8,power_law_1.2,0.1518272042274475
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,8,32,power_law_1.2,0.029177600145339967
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,balanced,0.05910933514436086
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,128,32,8,power_law_1.2,0.2206399917602539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,power_law_1.01,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,8,32,power_law_1.2,0.02913280129432678
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,balanced,0.06091733276844025
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,128,32,8,power_law_1.2,0.28460159301757815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,power_law_1.01,0.04223999977111816
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,8,32,power_law_1.2,0.032646399736404416
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,balanced,0.06926933427651723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,128,32,8,power_law_1.2,0.41125760078430174
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,power_law_1.01,0.04214400053024292
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,8,32,power_law_1.2,0.035071998834609985
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,power_law_1.01,0.04257920086383819
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,128,32,8,power_law_1.2,0.5410816192626953
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,balanced,0.07794133325417836
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,8,32,power_law_1.2,0.041094401478767396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,power_law_1.01,0.04335359930992126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,128,32,8,power_law_1.2,0.6372543811798096
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,power_law_1.01,0.044889599084854126
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,balanced,0.09962133566538493
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,8,32,power_law_1.2,0.041068801283836366
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,128,32,8,power_law_1.2,0.9498751640319825
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,power_law_1.01,0.04826880097389221
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,8,32,power_law_1.2,0.04131839871406555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,balanced,0.11947199702262878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,power_law_1.01,0.049184000492095946
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,128,32,8,power_law_1.2,1.9443967819213868
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,8,32,power_law_1.2,0.04123519957065582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,power_law_1.01,0.05562880039215088
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,8,32,power_law_1.2,0.041536000370979306
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,power_law_1.01,0.05716480016708374
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,balanced,0.15678399801254272
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,8,32,power_law_1.2,0.04222719967365265
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,power_law_1.01,0.061401599645614625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,8,32,power_law_1.2,0.042905598878860474
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,power_law_1.01,0.06947199702262878
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,balanced,0.026901334524154663
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,balanced,0.19338667392730713
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,8,32,power_law_1.2,0.044409599900245664
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,power_law_1.01,0.0857151985168457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,balanced,0.0281333327293396
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,8,32,power_law_1.2,0.04792959988117218
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,power_law_1.01,0.027289599180221558
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,balanced,0.028570666909217834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,power_law_1.01,0.09633280038833618
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,8,32,power_law_1.2,0.04878720045089722
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,balanced,0.030991998811562855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,power_law_1.01,0.12922240495681764
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,power_law_1.01,0.028019198775291444
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,balanced,0.263973335425059
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,balanced,0.033146666983763375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,8,32,power_law_1.2,0.05511040091514587
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,power_law_1.01,0.1739135980606079
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,balanced,0.03437866767247518
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,power_law_1.01,0.027859199047088622
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,8,32,power_law_1.2,0.056383997201919556
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,balanced,0.04033066580692927
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,power_law_1.01,0.23315200805664063
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,power_law_1.01,0.030559998750686646
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,balanced,0.03979733337958654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,8,32,power_law_1.2,0.06533759832382202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,power_law_1.01,0.32760961055755616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,power_law_1.01,0.03219839930534363
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,balanced,0.039813332259655
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,balanced,0.03985599925120672
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,8,32,power_law_1.2,0.0689791977405548
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,balanced,0.34139732519785565
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,power_law_1.01,0.4509376049041748
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,power_law_1.01,0.034041601419448855
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,balanced,0.04031466692686081
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,8,32,power_law_1.2,0.08871039748191833
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,power_law_1.01,0.03945600092411041
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,power_law_1.01,0.5871615886688233
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,balanced,0.03942933430274328
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,8,32,power_law_1.2,0.09804800152778625
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,power_law_1.01,0.03976320028305054
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,balanced,0.041296000281969704
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,power_law_1.01,0.7293759822845459
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,balanced,0.04158399999141693
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,power_law_1.01,0.0403328001499176
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,8,32,power_law_1.2,0.14419200420379638
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,power_law_1.01,1.1500736236572267
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,balanced,0.043866669138272606
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,power_law_1.01,0.040115201473236085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,8,32,power_law_1.2,0.18142720460891723
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,balanced,0.4210826555887858
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,balanced,0.047050664822260536
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,power_law_1.01,2.2854080200195312
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,power_law_1.01,0.039801600575447085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,8,32,power_law_1.2,0.25824000835418703
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,balanced,0.0491839994986852
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,power_law_1.01,0.040729600191116336
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,balanced,0.05807466804981232
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,8,32,power_law_1.2,0.32430078983306887
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,power_law_1.01,0.04056960046291351
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,balanced,0.05966933568318685
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,8,32,power_law_1.2,0.4753920078277588
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,power_law_1.01,0.041920000314712526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,balanced,0.07155199845631917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,8,32,power_law_1.2,0.6216896057128907
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,power_law_1.01,0.044537600874900815
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,balanced,0.0813973347345988
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,8,32,power_law_1.2,0.7754687786102294
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,power_law_1.01,0.04795520007610321
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,balanced,0.6605653365453085
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,balanced,0.10331199566523235
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,8,32,power_law_1.2,1.2192255973815918
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,power_law_1.01,0.05121279954910278
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,power_law_1.01,0.0638592004776001
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,balanced,0.12321066856384277
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,power_law_1.2,2.4040128707885744
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,power_law_1.01,0.06787840127944947
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,balanced,0.1623146633307139
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,power_law_1.01,0.0812991976737976
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,power_law_1.01,0.09693440198898315
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,power_law_1.01,0.1241536021232605
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,balanced,0.20056533813476562
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,16,16,power_law_1.2,0.027500799298286437
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,power_law_1.01,0.16732800006866455
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,16,16,power_law_1.2,0.027558401226997375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,power_law_1.01,0.23464319705963135
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,16,16,power_law_1.2,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,power_law_1.01,0.30122239589691163
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,balanced,0.2752426664034526
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,16,16,power_law_1.2,0.03038719892501831
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,power_law_1.01,0.44727039337158203
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,16,16,power_law_1.2,0.03196159899234772
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,power_law_1.01,0.5474239826202393
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,16,16,power_law_1.2,0.03410559892654419
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,balanced,0.35728001594543457
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,power_law_1.01,0.7767615795135498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,8,32,balanced,1.2988746960957844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,16,16,power_law_1.2,0.03935360014438629
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,power_law_1.01,1.098528003692627
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,16,16,power_law_1.2,0.039552000164985654
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,16,16,power_law_1.2,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,power_law_1.01,2.330124855041504
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,16,16,power_law_1.2,0.04017919898033142
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,balanced,0.44859735171000165
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,16,16,power_law_1.2,0.040191999077796935
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,16,16,power_law_1.2,0.040428799390792844
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,16,16,power_law_1.2,0.04079360067844391
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,balanced,0.026533332963784535
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,balanced,0.027632000545660656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,16,16,power_law_1.2,0.04207360148429871
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,balanced,0.028042666614055634
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,16,16,power_law_1.2,0.0447488009929657
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,balanced,0.031023999055226643
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,balanced,0.03204799940188726
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,16,16,power_law_1.2,0.048153600096702574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,balanced,0.03233066697915395
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,balanced,0.692799965540568
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,balanced,0.03486400097608566
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,16,16,power_law_1.2,0.05280640125274658
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,balanced,0.03470933437347412
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,16,16,power_law_1.2,0.06479359865188598
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,balanced,0.038015998899936676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,16,16,power_law_1.2,0.07000319957733155
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,balanced,0.03841066608826319
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,balanced,0.03889599939187368
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,16,16,power_law_1.2,0.08717439770698547
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,16,16,power_law_1.2,0.09884799718856811
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,balanced,0.03956266740957896
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,balanced,0.039706667264302574
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,16,16,power_law_1.2,0.1383936047554016
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,balanced,0.04087999959786733
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,16,16,power_law_1.2,0.2005376100540161
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,balanced,0.043653334180514015
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,16,16,power_law_1.2,0.27806079387664795
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,balanced,0.0513866643110911
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,16,16,power_law_1.2,0.3377919912338257
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,balanced,0.05516799787680308
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,16,16,power_law_1.2,0.6001344203948975
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,balanced,0.07521066566308339
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,balanced,0.08470933636029561
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,16,16,power_law_1.2,0.7009856224060058
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,balanced,0.10748799641927083
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,16,16,power_law_1.2,0.9654272079467774
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,balanced,1.3557920455932617
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,balanced,0.12774399916330972
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,16,16,power_law_1.2,1.5064319610595702
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,16,16,power_law_1.2,2.869107246398926
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,balanced,0.17003200451533
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,power_law_1.01,0.02622080147266388
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,power_law_1.01,0.0268095999956131
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,balanced,0.2111519972483317
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,power_law_1.01,0.0271807998418808
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,power_law_1.01,0.029600000381469725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,power_law_1.01,0.03073279857635498
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,balanced,0.2918826738993327
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,power_law_1.01,0.03237119913101196
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,power_law_1.01,0.034169599413871765
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,power_law_1.01,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,power_law_1.01,0.03774079978466034
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,balanced,0.3776479959487915
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,power_law_1.01,0.038227200508117676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,power_law_1.01,0.03927040100097656
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,power_law_1.01,0.03958399891853333
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,power_law_1.01,0.03925119936466217
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,power_law_1.01,0.04000000059604645
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,power_law_1.01,0.04099839925765991
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,balanced,0.47860264778137207
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,power_law_1.01,0.04530560076236725
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1,2880,2880,4,32,32,8,power_law_1.2,0.026655998826026917
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,power_law_1.01,0.04728319942951202
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,power_law_1.01,0.05726079940795899
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2,2880,2880,4,32,32,8,power_law_1.2,0.027539199590682982
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,power_law_1.01,0.06202239990234375
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4,2880,2880,4,32,32,8,power_law_1.2,0.02874239981174469
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,power_law_1.01,0.08361600041389465
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,power_law_1.01,0.09646080136299133
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8,2880,2880,4,32,32,8,power_law_1.2,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,power_law_1.01,0.1218559980392456
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,power_law_1.01,0.1554304003715515
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16,2880,2880,4,32,32,8,power_law_1.2,0.030796799063682555
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,power_law_1.01,0.20385279655456542
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,balanced,0.7287466526031494
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32,2880,2880,4,32,32,8,power_law_1.2,0.032179200649261476
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,power_law_1.01,0.2756608009338379
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,48,2880,2880,4,32,32,8,power_law_1.2,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,power_law_1.01,0.4163968086242676
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,64,2880,2880,4,32,32,8,power_law_1.2,0.034534400701522826
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,power_law_1.01,0.5661183834075928
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,80,2880,2880,4,32,32,8,power_law_1.2,0.0389055997133255
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,power_law_1.01,0.7062143802642822
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,96,2880,2880,4,32,32,8,power_law_1.2,0.03863039910793305
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,power_law_1.01,1.08985595703125
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,128,2880,2880,4,32,32,8,power_law_1.2,0.039852800965309146
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,power_law_1.01,2.261235237121582
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,160,2880,2880,4,32,32,8,power_law_1.2,0.03956480026245117
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,192,2880,2880,4,32,32,8,power_law_1.2,0.040524798631668094
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,256,2880,2880,4,32,32,8,power_law_1.2,0.04296959936618805
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,320,2880,2880,4,32,32,8,power_law_1.2,0.04286080002784729
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,384,2880,2880,4,32,32,8,power_law_1.2,0.0462336003780365
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,512,2880,2880,4,32,32,8,power_law_1.2,0.04913919866085052
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,balanced,1.4268372853597004
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,768,2880,2880,4,32,32,8,power_law_1.2,0.058143997192382814
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1024,2880,2880,4,32,32,8,power_law_1.2,0.06266239881515503
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,1536,2880,2880,4,32,32,8,power_law_1.2,0.08490880131721497
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,2048,2880,2880,4,32,32,8,power_law_1.2,0.09648000001907349
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,3072,2880,2880,4,32,32,8,power_law_1.2,0.13508479595184325
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,4096,2880,2880,4,32,32,8,power_law_1.2,0.17966079711914062
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,6144,2880,2880,4,32,32,8,power_law_1.2,0.2705600023269653
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,8192,2880,2880,4,32,32,8,power_law_1.2,0.3316351890563965
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,12288,2880,2880,4,32,32,8,power_law_1.2,0.5047808170318604
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,16384,2880,2880,4,32,32,8,power_law_1.2,0.6374911785125732
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,20480,2880,2880,4,32,32,8,power_law_1.2,0.8658304214477539
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,32768,2880,2880,4,32,32,8,power_law_1.2,1.3277119636535644
TRTLLM,1.2.0rc5,NVIDIA H100 80GB HBM3,moe,moe_torch_flow,w4a16_mxfp4,65536,2880,2880,4,32,32,8,power_law_1.2,2.875481605529785
